train_example

simon-donike · simon-donike · commit f1e816c3832b · 2025-11-17T11:36:01.000Z
diff --git a/docs/index.md b/docs/index.md
@@ -4,7 +4,7 @@
 
 | **PyPI** | **Versions** | **Docs & License** | **Tests** | **Reference** |
 |:---------:|:-------------:|:------------------:|:----------:|:--------------:|
-| [![PyPI](https://img.shields.io/pypi/v/opensr-srgan)](https://pypi.org/project/opensr-srgan/) | ![PythonVersion](https://img.shields.io/badge/Python-v3.10%20v3.12-blue.svg)<br>![PLVersion](https://img.shields.io/badge/PyTorchLightning-v1.9%20v2.0-blue.svg) | [![Docs](https://img.shields.io/badge/docs-mkdocs%20material-brightgreen)](https://srgan.opensr.eu)<br>![License: Apache](https://img.shields.io/badge/license-Apache%20License%202.0-blue) | [![CI](https://github.com/simon-donike/SISR-RS-SRGAN/actions/workflows/ci.yml/badge.svg)](https://github.com/simon-donike/SISR-RS-SRGAN/actions/workflows/ci.yml)<br>[![codecov](https://codecov.io/gh/simon-donike/SISR-RS-SRGAN/graph/badge.svg?token=PWZND7MHRR)](https://codecov.io/gh/simon-donike/SISR-RS-SRGAN) | [![arXiv](https://img.shields.io/badge/arXiv-2511.10461-b31b1b.svg)](https://arxiv.org/abs/2511.10461)<br>[![DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.17590993.svg)](https://doi.org/10.5281/zenodo.17590993) |
+| [![PyPI](https://img.shields.io/pypi/v/opensr-srgan)](https://pypi.org/project/opensr-srgan/) | ![PythonVersion](https://img.shields.io/badge/Python-v3.10%20v3.12-blue.svg)<br>![PLVersion](https://img.shields.io/badge/PyTorchLightning-v1.9%20v2.0-blue.svg) | [![Docs](https://img.shields.io/badge/docs-mkdocs%20material-brightgreen)](https://srgan.opensr.eu)<br>![License: Apache](https://img.shields.io/badge/license-Apache%20License%202.0-blue) | [![CI](https://github.com/simon-donike/SISR-RS-SRGAN/actions/workflows/ci.yml/badge.svg)](https://github.com/simon-donike/SISR-RS-SRGAN/actions/workflows/ci.yml)<br>[![codecov](https://codecov.io/github/ESAOpenSR/SRGAN/graph/badge.svg?token=LQ69MIMLVE)](https://codecov.io/github/ESAOpenSR/SRGAN) | [![arXiv](https://img.shields.io/badge/arXiv-2511.10461-b31b1b.svg)](https://arxiv.org/abs/2511.10461)<br>[![DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.17590993.svg)](https://doi.org/10.5281/zenodo.17590993) |
 
 ![Super-resolved Sentinel-2 example](assets/6band_banner.png)
 
diff --git a/opensr_srgan/configs/config_training_example.yaml b/opensr_srgan/configs/config_training_example.yaml
@@ -0,0 +1,130 @@
+# ============================================================================ #
+# ⚙️ GENERAL CONFIGURATION FILE
+# ---------------------------------------------------------------------------- #
+# This file defines all key components for training and evaluating the SR model.
+# Sections: Data, Model, Training, Architecture, Optimization, Scheduling, Logging
+# ============================================================================ #
+
+
+# ============================================================================ #
+# 🗂️ DATA SETTINGS
+# ---------------------------------------------------------------------------- #
+Data:
+  # Loader parameters
+  train_batch_size: 2        # Batch size for training
+  val_batch_size: 2           # Batch size for validation
+  num_workers: 1              # Number of parallel workers for dataloader
+  prefetch_factor: 2          # Batches prefetched per worker (2 is a stable default)
+
+  # Dataset configuration
+  dataset_type: 'SISR_WW'       # Choose dataset type: ['cv', 'SPOT6', 'S2_6b', 'SISR_WW']
+  normalization: 'normalise_10k' # Normalization strategy for data processing
+
+
+# ============================================================================ #
+# 🧠 MODEL AND CHECKPOINT SETTINGS
+# ---------------------------------------------------------------------------- #
+Model:
+  in_bands: 4                 # Number of input channels (e.g. RGB-NIR-SWIR etc.)
+  continue_training: False    # Resume full training (PL checkpoint path or False)
+  load_checkpoint: False      # Load weights only (path or False)
+
+
+# ============================================================================ #
+# 🏋️ TRAINING CONFIGURATION
+# ---------------------------------------------------------------------------- #
+Training:
+  # --- Hardware Setup
+  device: "cuda"                # Runtime device backend: ['cuda', 'cpu']
+  gpus: [0]                    # GPU device indices to use, given as a list, e.g. [0] or [0,2]
+  # --- General Training Setup
+  max_epochs: 9999            # Maximum number of training epochs
+  val_check_interval: 0.25     # Validate every given fraction of an epoch (float, e.g. 0.25) or every N steps (int)
+  limit_val_batches: 250      # Limit number of validation batches
+  
+  # --- Pretraining and adversarial setup ---
+  pretrain_g_only: True        # Train generator only for initial phase
+  g_pretrain_steps: 1000      # Number of generator-only warmup steps
+  adv_loss_ramp_steps: 500    # Gradual adversarial weight ramp steps
+  label_smoothing: True        # Discriminator target smoothing (1.0 → 0.9)
+
+  EMA:
+    enabled: False             # Maintain exponential moving average of generator weights
+    decay: 0.999               # EMA decay factor (closer to 1.0 → smoother updates)
+    update_after_step: 0       # Delay EMA updates until this global step (0 = immediate)
+    use_num_updates: True      # Use adaptive decay warmup based on number of updates
+
+  Losses:
+    # --- GAN term ---
+    adv_loss_beta: 0.001       # Final adversarial loss weight after ramp-up - original 0.001
+    adv_loss_schedule: 'cosine'   # Adversarial weight ramp type: ['linear', 'cosine']
+
+    # --- Content loss components (GeneratorContentLoss) ---
+    l1_weight: 1.0             # L1 loss over all bands
+    sam_weight: 0.05           # Spectral Angle Mapper loss
+    perceptual_weight: 0.2     # Perceptual similarity term weight
+    perceptual_metric: 'vgg'   # ['vgg', 'lpips'] - LPIPS requires pip install lpips
+    tv_weight: 0.0             # Total Variation regularization (optional)
+
+    # --- Metric evaluation settings ---
+    max_val: 1.0               # Peak value assumed by PSNR/SSIM after metric preprocessing
+    ssim_win: 11               # SSIM window size (must be odd integer)
+
+
+# ============================================================================ #
+# 🧩 ARCHITECTURAL PARAMETERS
+# ---------------------------------------------------------------------------- #
+# See the docs for architecture details and suggestions
+Generator:
+  model_type: 'SRResNet'       # Generator family: ['SRResNet', 'stochastic_gan', 'esrgan']
+  block_type: 'rrdb'           # SRResNet block variant: ['standard', 'res', 'rcab', 'rrdb', 'lka']
+  large_kernel_size: 9         # Kernel for head and tail conv layers (SRResNet/stochastic)
+  small_kernel_size: 3         # Kernel for intermediate blocks (SRResNet/stochastic)
+  n_channels: 32               # Feature width (RRDB/ESRGAN uses this as trunk width)
+  n_blocks: 4                 # Residual/attention blocks (ESRGAN: number of RRDB blocks)
+  scaling_factor: 4            # Upscaling factor (e.g., 2×, 4×, 8×)
+  growth_channels: 32          # ESRGAN-specific RRDB growth channels (ignored otherwise)
+  res_scale: 0.2               # Residual scaling used by stochastic/ESRGAN variants
+
+Discriminator:
+  model_type: 'standard'       # Discriminator architecture selector ['standard', 'patchgan', 'esrgan']
+  n_blocks: 2                  # Convolutional depth for SRGAN/PatchGAN (ignored by ESRGAN)
+  base_channels: 32            # ESRGAN discriminator base feature width (ignored otherwise)
+  linear_size: 1024            # Hidden dim of ESRGAN discriminator head (ignored otherwise)
+
+# ============================================================================ #
+# 🧮 OPTIMIZATION SETTINGS
+# ---------------------------------------------------------------------------- #
+Optimizers:
+  optim_g_lr: 1.0e-4           # Learning rate for Generator (dotted mantissa so YAML 1.1 loaders parse a float)
+  optim_d_lr: 1.0e-6           # Learning rate for Discriminator (dotted mantissa so YAML 1.1 loaders parse a float)
+  gradient_clip_val: 1.0       # Gradient clipping value (0 disables clipping)
+  betas: [0.0, 0.99]           # Optimizer beta coefficients (optional)
+  eps: 1.0e-7                  # Optimizer epsilon term (optional)
+  weight_decay_g: 0.0          # Weight decay for Generator (optional)
+  weight_decay_d: 0.0          # Weight decay for Discriminator (optional)
+
+# ============================================================================ #
+# 📉 SCHEDULERS AND EARLY STOPPING
+# ---------------------------------------------------------------------------- #
+Schedulers:
+  g_warmup_steps: 10        # Generator warmup LR curve duration in steps (0 disables warmup)
+  g_warmup_type: 'cosine'      # Generator warmup curve: ['cosine', 'linear']
+  metric_g: 'val_metrics/l1'     # Metric monitored for Generator LR scheduler
+  metric_d: 'discriminator/adversarial_loss'     # Metric monitored for Discriminator LR scheduler
+  patience_g: 10              # Patience (epochs) for Generator LR scheduler
+  patience_d: 10              # Patience (epochs) for Discriminator LR scheduler
+  factor_g: 0.5                # LR reduction factor for Generator
+  factor_d: 0.5                # LR reduction factor for Discriminator
+  verbose: True                # Enable scheduler logging output
+
+
+# ============================================================================ #
+# 🧾 LOGGING SETTINGS
+# ---------------------------------------------------------------------------- #
+Logging:
+  num_val_images: 5            # Number of validation images logged per epoch
+  wandb:
+    enabled: False              # Toggle Weights & Biases logging on/off
+    entity: "opensr"           # W&B entity or team name
+    project: "SRGAN_10m"        # W&B project name