davitpapikyan
diff --git a/‎README.md
+25 b/‎README.md
+25
diff --git a/‎config.py
+207 b/‎config.py
+207
diff --git a/‎experiment_configs/t2m_GlobalStandardScaling_Monthly.json
+81 b/‎experiment_configs/t2m_GlobalStandardScaling_Monthly.json
+81
@@ -0,0 +1,25 @@
+# Probabilistic Downscaling of Climate Variables
+
+Project with Colloquium (MA8114)  at TUM: Probabilistic Downscaling of Climate Variables Using Denoising Diffusion Probabilistic Models
+
+Supervisor: Prof. Dr. Rüdiger Westermann (Chair of Computer Graphics and Visualization)\
+Advisor: Kevin Höhlein (Chair of Computer Graphics and Visualization)
+
+---
+
+Downscaling combines methods that are used to infer high-resolution information from 
+low-resolution climate variables. We approach this problem as an image super-resolution 
+task and employ Denoising Diffusion Probabilistic Model to generate finer-scale variables 
+conditioned on coarse-scale information. Experiments are conducted on WeatherBench dataset. 
+Experiments are conducted by analysing temperature at 2 m height above the surface. 
+
+![](results/reverse_diffusion_steps.jpg?raw=true)
+
+---
+
+## References
+
+- Liangwei Jiang (2021) Image-Super-Resolution-via-Iterative-Refinement [[Source code](https://github.com/Janspiry/Image-Super-Resolution-via-Iterative-Refinement#readme)]
+- Song et al. (2021) Score-Based Generative Modeling through Stochastic Differential Equations [[Source code](https://github.com/yang-song/score_sde_pytorch)]
+- Stephan Rasp, Peter D. Dueben, Sebastian Scher, Jonathan A. Weyn, Soukayna Mouatadid, and Nils Thuerey, 2020. WeatherBench: A benchmark dataset for data-driven weather forecasting. arXiv: [WeatherBench: A benchmark dataset for data-driven weather forecasting
+](https://arxiv.org/abs/2002.00469)
@@ -0,0 +1,207 @@
+"""Defines configuration parameters for the whole model and dataset.
+"""
+import argparse
+import json
+import os
+from collections import OrderedDict
+from datetime import datetime
+
+
+def get_current_datetime() -> str:
+    """Converts the current datetime to string.
+
+    Returns:
+        String version of current datetime of the form: %y%m%d_%H%M%S.
+    """
+    return datetime.now().strftime("%y%m%d_%H%M%S")
+
+
+def mkdirs(paths) -> None:
+    """Creates directories represented by paths argument.
+
+    Args:
+        paths: Either list of paths or a single path.
+    """
+    if isinstance(paths, str):
+        os.makedirs(paths, exist_ok=True)
+    else:
+        for path in paths:
+            os.makedirs(path, exist_ok=True)
+
+
+class Config:
+    """Configuration class.
+
+    Attributes:
+        args: Command line aarguments.
+        root: Configuration json file.
+        gpu_ids: A list of GPU IDs.
+        params: A dictionary containing configuration parameters stored in a json file.
+        name: Name of the experiment.
+        phase: Either train or val.
+        distributed: Whether the computation will be distributed among multiple GPUs or not.
+        log: Path to logs.
+        tb_logger: Tensorboard logging directory.
+        results: Validation results directory.
+        checkpoint: Model checkpoints directory.
+        resume_state: The path to load the network.
+        dataset_name: The name of dataset.
+        dataroot: The path to dataset.
+        batch_size: Batch size.
+        num_workers: The number of processes for multi-process data loading.
+        use_shuffle: Either to shuffle the training data or not.
+        train_min_date: Minimum date starting from which to read the data for training.
+        train_max_date: Maximum date until which to read the date for training.
+        val_min_date: Minimum date starting from which to read the data for validation.
+        val_max_date: Maximum date until which to read the date for validation.
+        train_subset_min_date: Minimum date starting from which to read the data for model evaluation on train subset.
+        train_subset_max_date: Maximum date starting until which to read the data for model evaluation on train subset.
+        variables: A list of WeatherBench variables.
+        finetune_norm: Whetehr to fine-tune or train from scratch.
+        in_channel: The number of channels of input tensor of U-Net.
+        out_channel: The number of channels of output tensor of U-Net.
+        inner_channel: Timestep embedding dimension.
+        norm_groups: The number of groups for group normalization.
+        channel_multiplier: A tuple specifying the scaling factors of channels.
+        attn_res: A tuple of spatial dimensions indicating in which resolutions to use self-attention layer.
+        res_blocks: The number of residual blocks.
+        dropout: Dropout probability.
+        init_method: NN weight initialization method. One of normal, kaiming or orthogonal inisializations.
+        train_schedule: Defines the type of beta schedule for training.
+        train_n_timestep: Number of diffusion timesteps for training.
+        train_linear_start: Minimum value of the linear schedule for training.
+        train_linear_end: Maximum value of the linear schedule for training.
+        val_schedule: Defines the type of beta schedule for validation.
+        val_n_timestep: Number of diffusion timesteps for validation.
+        val_linear_start: Minimum value of the linear schedule for validation.
+        val_linear_end: Maximum value of the linear schedule for validation.
+        test_schedule: Defines the type of beta schedule for inference.
+        test_n_timestep: Number of diffusion timesteps for inference.
+        test_linear_start: Minimum value of the linear schedule for inference.
+        test_linear_end: Maximum value of the linear schedule for inference.
+        conditional: Whether to condition on INTERPOLATED image or not.
+        diffusion_loss: Either 'l1' or 'l2'.
+        n_iter: Number of iterations to train.
+        val_freq: Validation frequency.
+        save_checkpoint_freq: Model checkpoint frequency.
+        print_freq: The frequency of displaying training information.
+        n_val_vis: Number of data points to visualize.
+        val_vis_freq: Validation data points visualization frequency.
+        sample_size: Numer of SR images to generate to calculate metrics.
+        optimizer_type: The name of optimization algorithm. Supported values are 'adam', 'adamw'.
+        amsgrad: Whether to use the AMSGrad variant of optimizer.
+        lr: The learning rate.
+        experiments_root: The path to experiment.
+        tranform_monthly: Whether to apply transformation monthly or on the whole dataset.
+        height: U-Net input tensor height value.
+    """
+
+    def __init__(self, args: argparse.Namespace):
+        self.args = args
+        self.root = self.args.config
+        self.gpu_ids = self.args.gpu_ids
+        self.params = {}
+        self.experiments_root = None
+        self.__parse_configs()
+        self.name = self.params["name"]
+        self.phase = self.params["phase"]
+        self.gpu_ids = self.params["gpu_ids"]
+        self.distributed = self.params["distributed"]
+        self.log = self.params["path"]["log"]
+        self.tb_logger = self.params["path"]["tb_logger"]
+        self.results = self.params["path"]["results"]
+        self.checkpoint = self.params["path"]["checkpoint"]
+        self.resume_state = self.params["path"]["resume_state"]
+        self.dataset_name = self.params["data"]["name"]
+        self.dataroot = self.params["data"]["dataroot"]
+        self.batch_size = self.params["data"]["batch_size"]
+        self.num_workers = self.params["data"]["num_workers"]
+        self.use_shuffle = self.params["data"]["use_shuffle"]
+        self.train_min_date = self.params["data"]["train_min_date"]
+        self.train_max_date = self.params["data"]["train_max_date"]
+        self.train_subset_min_date = self.params["data"]["train_subset_min_date"]
+        self.train_subset_max_date = self.params["data"]["train_subset_max_date"]
+        self.tranform_monthly = self.params["data"]["apply_tranform_monthly"]
+        self.transformation = self.params["data"]["transformation"]
+        self.val_min_date = self.params["data"]["val_min_date"]
+        self.val_max_date = self.params["data"]["val_max_date"]
+        self.variables = self.params["data"]["variables"]
+        self.height = self.params["data"]["height"]
+        self.finetune_norm = self.params["model"]["finetune_norm"]
+        self.in_channel = self.params["model"]["unet"]["in_channel"]
+        self.out_channel = self.params["model"]["unet"]["out_channel"]
+        self.inner_channel = self.params["model"]["unet"]["inner_channel"]
+        self.norm_groups = self.params["model"]["unet"]["norm_groups"]
+        self.channel_multiplier = self.params["model"]["unet"]["channel_multiplier"]
+        self.attn_res = self.params["model"]["unet"]["attn_res"]
+        self.res_blocks = self.params["model"]["unet"]["res_blocks"]
+        self.dropout = self.params["model"]["unet"]["dropout"]
+        self.init_method = self.params["model"]["unet"]["init_method"]
+        self.train_schedule = self.params["model"]["beta_schedule"]["train"]["schedule"]
+        self.train_n_timestep = self.params["model"]["beta_schedule"]["train"]["n_timestep"]
+        self.train_linear_start = self.params["model"]["beta_schedule"]["train"]["linear_start"]
+        self.train_linear_end = self.params["model"]["beta_schedule"]["train"]["linear_end"]
+        self.val_schedule = self.params["model"]["beta_schedule"]["val"]["schedule"]
+        self.val_n_timestep = self.params["model"]["beta_schedule"]["val"]["n_timestep"]
+        self.val_linear_start = self.params["model"]["beta_schedule"]["val"]["linear_start"]
+        self.val_linear_end = self.params["model"]["beta_schedule"]["val"]["linear_end"]
+        self.test_schedule = self.params["model"]["beta_schedule"]["test"]["schedule"]
+        self.test_n_timestep = self.params["model"]["beta_schedule"]["test"]["n_timestep"]
+        self.test_linear_start = self.params["model"]["beta_schedule"]["test"]["linear_start"]
+        self.test_linear_end = self.params["model"]["beta_schedule"]["test"]["linear_end"]
+        self.conditional = self.params["model"]["diffusion"]["conditional"]
+        self.diffusion_loss = self.params["model"]["diffusion"]["loss"]
+        self.n_iter = self.params["training"]["epoch_n_iter"]
+        self.val_freq = self.params["training"]["val_freq"]
+        self.save_checkpoint_freq = self.params["training"]["save_checkpoint_freq"]
+        self.print_freq = self.params["training"]["print_freq"]
+        self.n_val_vis = self.params["training"]["n_val_vis"]
+        self.val_vis_freq = self.params["training"]["val_vis_freq"]
+        self.sample_size = self.params["training"]["sample_size"]
+        self.optimizer_type = self.params["training"]["optimizer"]["type"]
+        self.amsgrad = self.params["training"]["optimizer"]["amsgrad"]
+        self.lr = self.params["training"]["optimizer"]["lr"]
+
+    def __parse_configs(self):
+        """Reads configureation json file and stores in params attribute."""
+        json_str = ""
+        with open(self.root, "r") as f:
+            for line in f:
+                json_str = f"{json_str}{line.split('//')[0]}\n"
+
+        self.params = json.loads(json_str, object_pairs_hook=OrderedDict)
+
+        if not self.params["path"]["resume_state"]:
+            self.experiments_root = os.path.join("experiments", f"{self.params['name']}_{get_current_datetime()}")
+        else:
+            self.experiments_root = "/".join(self.params["path"]["resume_state"].split("/")[:-2])
+
+        for key, path in self.params["path"].items():
+            if not key.startswith("resume"):
+                self.params["path"][key] = os.path.join(self.experiments_root, path)
+                mkdirs(self.params["path"][key])
+
+        if self.gpu_ids:
+            self.params["gpu_ids"] = [int(gpu_id) for gpu_id in self.gpu_ids.split(",")]
+            gpu_list = self.gpu_ids
+        else:
+            gpu_list = ",".join(str(x) for x in self.params["gpu_ids"])
+
+        os.environ["CUDA_VISIBLE_DEVICES"] = gpu_list
+        self.params["distributed"] = True if len(gpu_list) > 1 else False
+
+    def __getattr__(self, item):
+        """Returns None when attribute doesn't exist.
+
+        Args:
+            item: Attribute to retrieve.
+
+        Returns:
+            None
+        """
+        return None
+
+    def get_hyperparameters_as_dict(self):
+        """Returns dictionary containg parsed configuration json file.
+        """
+        return self.params
@@ -0,0 +1,81 @@
+{
+    "name": "t2m_GlobalSS_Monthly",
+    "phase": "train",
+    "gpu_ids": [0],
+    "path": {
+        "log": "logs",
+        "tb_logger": "tb_logger",
+        "results": "results",
+        "checkpoint": "checkpoint",
+        "resume_state": null
+    },
+    "data": {
+        "name": "WeatherBench",
+        "dataroot": "/mnt/data/papikyan/WeatherBench/numpy",
+        "batch_size": 16,
+        "num_workers": 4,
+        "use_shuffle": true,
+        "train_min_date": "1979-01-01-00",
+        "train_max_date": "2016-01-01-00",
+        "train_subset_min_date": "2014-01-01-00",
+        "train_subset_max_date": "2016-01-01-00",
+        "transformation": "GlobalStandardScaling",
+        "apply_tranform_monthly": true,
+        "val_min_date": "2016-01-01-00",
+        "val_max_date": "2018-01-01-00",
+        "variables": ["t2m"],
+        "height": 128
+    },
+    "model": {
+        "finetune_norm": false,
+        "unet": {
+            "in_channel": 2,  // This should be equal to the number of variables * 2. Used in only networks.py 121 line.
+            "out_channel": 1, // This should be equal to the number of variables.
+            "inner_channel": 64,
+            "norm_groups": 32,  // 16
+            "channel_multiplier": [1, 2, 4, 8],
+            "attn_res": [16],  // Possible values are 128, 64, 32, 16 and depends on channel_multipliers.
+            "res_blocks": 1,
+            "dropout": 0.7,
+            "init_method": "kaiming"
+        },
+        "beta_schedule": {
+            "train": {
+                "schedule": "cosine",
+                "n_timestep": 2000,
+                "linear_start": 1e-6,
+                "linear_end": 1e-2
+            },
+            "val": {
+                "schedule": "cosine",
+                "n_timestep": 100,
+                "linear_start": 1e-6,
+                "linear_end": 1e-2
+            },
+            "test": {
+                "schedule": "cosine",
+                "n_timestep": 1000,
+                "linear_start": 1e-6,
+                "linear_end": 1e-2
+            }
+        },
+        "diffusion": {
+            "conditional": true,
+            "loss": "l2"
+        }
+    },
+    "training": {
+        "epoch_n_iter": 20000,
+        "val_freq": 2000,
+        "save_checkpoint_freq": 2000,
+        "print_freq": 100,
+        "n_val_vis": 1,
+        "val_vis_freq": 500,
+        "sample_size": 5,
+        "optimizer": {
+            "type": "adam",  // Possible types are ['adam', 'adamw']
+            "amsgrad": false,
+            "lr": 5e-5
+        }
+    }
+}