Merge pull request #604 from valhassan/601-maintenance-manage-geo-deep-learning-with-uv-by-astral

valhassan · web-flow · commit a2410c8d789b · 2025-11-10T15:49:18.000-05:00
601 maintenance manage geo deep learning with uv by astral
diff --git a/.gitignore b/.gitignore
@@ -2,6 +2,9 @@
 *.idea**
 *.vscode**
 
+# Distribution / packaging
+*.egg-info/
+
 # Specific folders name
 waterloo_subset_512/
 mlruns/
diff --git a/README.md b/README.md
@@ -4,17 +4,18 @@ A PyTorch Lightning-based framework for geospatial deep learning with multi-sens
 
 ## Overview
 
-Geo Deep Learning (GDL) is a modular framework designed for semantic segmentation of geospatial imagery using state-of-the-art deep learning models. Built on PyTorch Lightning, it provides efficient training pipelines for multi-sensor data with WebDataset support.
+Geo Deep Learning (GDL) is a modular framework designed to support a wide range of geospatial deep learning tasks such as semantic segmentation, object detection, and regression.
+Built on PyTorch Lightning, it provides efficient training pipelines for multi-sensor data.
 
 ## Features
 
-- **Multi-sensor Support**: Handle multiple Earth observation sensors simultaneously
-- **Modular Architecture**: Encoder-neck-decoder pattern with interchangeable components
-- **WebDataset Integration**: Efficient large-scale data loading and processing
-- **Multiple Model Types**: UNet++, SegFormer, DOFA (Dynamic-one-for-all Architecture)
-- **Distributed Training**: Multi-GPU training with DDP strategy
-- **MLflow Logging**: Comprehensive experiment tracking and model versioning
-- **Flexible Data Pipeline**: Support for CSV and WebDataset formats
+- **Multi-sensor Support**: Handle multiple Earth observation sensors simultaneously.
+- **Modular Architecture**: Encoder-neck-decoder pattern with interchangeable components.
+- **WebDataset Integration**: Efficient large-scale data loading and processing.
+- **Multiple Model Types**: UNet++, SegFormer, DOFA (Dynamic One-For-All foundation model).
+- **Distributed Training**: Multi-GPU training with supported strategies.
+- **MLflow Logging**: Comprehensive experiment tracking and model versioning.
+- **Flexible Data Pipeline**: Support for CSV and WebDataset formats.
 
 ## Architecture
 
@@ -31,23 +32,47 @@ Geo Deep Learning (GDL) is a modular framework designed for semantic segmentatio
 └── samplers/              # Custom data sampling strategies
 ```
 
+## Requirements
+- Install the [uv](https://docs.astral.sh/uv/) package manager for your OS.
+
 ## Quick Start
 
+1. **Clone the repository:**
 ```bash
-git clone <repository-url>
+git clone https://github.com/NRCan/geo-deep-learning.git
 cd geo-deep-learning
 ```
+2. **Install dependencies:**
 
-### Training
+For **GPU training** with CUDA 12.8:
+```bash
+uv sync --extra cu128
+```
 
+For **CPU-only** training:
 ```bash
-# Single GPU training
-python geo_deep_learning/train.py fit --config configs/dofa_config_RGB.yaml
+uv sync --extra cpu
 ```
+This creates a virtual environment in `.venv/` and installs all dependencies.
+
+3. **Activate the environment:**
+```bash
+# Linux/macOS
+source .venv/bin/activate
+
+# Windows
+.venv\Scripts\activate
+```
+
+Or use `uv run` to execute commands without manual activation:
+```bash
+uv run python geo_deep_learning/train.py fit --config configs/dofa_config_RGB.yaml
+```
+**Note:** *If you prefer to use conda or another environment manager, you can generate a `requirements.txt` file from the dependencies listed in `pyproject.toml` for manual installation.*
 
 ### Configuration
 
-Models are configured via YAML files in `configs/`:
+Models are configured via YAML files in the `configs/` directory:
 
 ```yaml
 model:
@@ -65,54 +90,53 @@ data:
     sensor_configs_path: "path/to/sensor_configs.yaml"
     batch_size: 16
     patch_size: [512, 512]
+
+trainer:
+  max_epochs: 100
+  precision: 16-mixed
+  accelerator: gpu
+  devices: 1
 ```
 
 ## Supported Models
 
-### DOFA (Domain-Oriented Foundation Architecture)
-- **DOFA Base**: 768-dim embeddings, suitable for most tasks
-- **DOFA Large**: 1024-dim embeddings, higher capacity
-- Multi-scale feature extraction with UperNet decoder
-- Support for wavelength-specific processing
-
 ### UNet++
-- Classic U-Net architecture with dense skip connections
-- Multiple encoder backbones (ResNet, EfficientNet, etc.)
-- Optimized for medical and satellite imagery
+- Classic U-Net architecture with dense skip connections.
+- Multiple encoder backbones (ResNet, EfficientNet, etc.).
+- Available through segmentation-models-pytorch.
 
 ### SegFormer
-- Transformer-based architecture for semantic segmentation
-- Hierarchical feature representation
-- Efficient attention mechanisms
+- Transformer-based architecture for semantic segmentation.
+- Hierarchical feature representation (MixTransformer encoder).
+- Multiple model sizes (B0-B5).
+
+### DOFA (Dynamic One-For-All foundation model)
+- **DOFA Base**: 768-dim embeddings, suitable for most tasks.
+- **DOFA Large**: 1024-dim embeddings, higher capacity.
+- Multi-scale feature extraction with UperNet decoder.
+- Support for wavelength-specific processing.
+
 
 ## Data Pipeline
 
 ### Multi-Sensor DataModule
-- **Sensor Mixing**: Combine data from multiple sensors during training
-- **WebDataset Format**: Efficient sharded data storage and loading
-- **Patch-based Processing**: Configurable patch sizes (default: 512x512)
-- **Data Augmentation**: Built-in augmentation pipeline
+- **Sensor Mixing**: Combine data from multiple sensors during training.
+- **WebDataset Format**: Efficient sharded data storage and loading.
 
 ### Supported Data Formats
-- **WebDataset**: Sharded tar files with metadata
-- **CSV**: Traditional CSV with file paths and labels
-- **Multi-sensor**: YAML configuration for sensor-specific settings
+- **WebDataset**: Sharded tar files with metadata.
+- **CSV**: Traditional CSV with file paths and labels.
+- **Multi-sensor**: YAML configuration for sensor-specific settings.
 
 ## Training Features
-
-- **Mixed Precision**: 16-bit mixed precision training
-- **Gradient Clipping**: Configurable gradient clipping
-- **Early Stopping**: Automatic training termination
-- **Model Checkpointing**: Best model saving based on validation metrics
-- **Visualization**: Built-in prediction visualization callbacks
-
-## Distributed Training
-
-The framework supports multi-GPU training with:
-- DDP (Distributed Data Parallel) strategy
-- Automatic mixed precision
-- Synchronized batch normalization
-- Efficient NCCL communication
+- **Large-scale Training**: Distributed training strategies enabled with PyTorch Lightning.
+- **Mixed Precision Training**: 16-bit mixed precision for faster training.
+- **Gradient Clipping**: Configurable gradient clipping for stability.
+- **Early Stopping**: Automatic training termination based on validation metrics.
+- **Model Checkpointing**: Saves best models based on validation performance.
+- **MLflow Integration**: Experiment tracking, metrics logging, and model registry.
+- **Visualization Callbacks**: Built-in prediction visualization during training.
+- **Learning Rate Scheduling**: Cosine annealing, step decay, and more.
 
 ## Development
 
diff --git a/geo_deep_learning/config/__init__.py b/geo_deep_learning/config/__init__.py
@@ -0,0 +1 @@
+"""Logging configuration."""
diff --git a/geo_deep_learning/config/log_config.yaml b/geo_deep_learning/config/log_config.yaml
diff --git a/geo_deep_learning/config/logging_config.py b/geo_deep_learning/config/logging_config.py
diff --git a/geo_deep_learning/models/encoders/mix_transformer.py b/geo_deep_learning/models/encoders/mix_transformer.py
@@ -7,11 +7,12 @@
 
 import torch
 import torch.nn.functional as fn
-from models.segmentation.base import EncoderMixin
 from timm.layers import DropPath, to_2tuple, trunc_normal_
 from torch import Tensor, nn
 from torch.utils import model_zoo
 
+from geo_deep_learning.models.segmentation.base import EncoderMixin
+
 
 class Mlp(nn.Module):
     """MLP module."""
diff --git a/geo_deep_learning/models/segmentation/segformer.py b/geo_deep_learning/models/segmentation/segformer.py
@@ -2,8 +2,12 @@
 
 import torch
 import torch.nn.functional as fn
-from models.decoders.segformer_mlp import Decoder
-from models.encoders.mix_transformer import DynamicMixTransformer, get_encoder
+
+from geo_deep_learning.models.decoders.segformer_mlp import Decoder
+from geo_deep_learning.models.encoders.mix_transformer import (
+    DynamicMixTransformer,
+    get_encoder,
+)
 
 from .base import BaseSegmentationModel
 
diff --git a/geo_deep_learning/tasks_with_models/segmentation_dofa.py b/geo_deep_learning/tasks_with_models/segmentation_dofa.py
@@ -16,10 +16,10 @@
 from torchmetrics.segmentation import MeanIoU
 from torchmetrics.wrappers import ClasswiseWrapper
 
+from geo_deep_learning.models.segmentation.dofa import DOFASegmentationModel
+from geo_deep_learning.tools.visualization import visualize_prediction
 from geo_deep_learning.utils.models import load_weights_from_checkpoint
 from geo_deep_learning.utils.tensors import denormalization
-from models.segmentation.dofa import DOFASegmentationModel
-from tools.visualization import visualize_prediction
 
 # Ignore warning about default grid_sample and affine_grid behavior triggered by kornia
 warnings.filterwarnings(
diff --git a/geo_deep_learning/tasks_with_models/segmentation_segformer.py b/geo_deep_learning/tasks_with_models/segmentation_segformer.py
@@ -16,10 +16,10 @@
 from torchmetrics.segmentation import MeanIoU
 from torchmetrics.wrappers import ClasswiseWrapper
 
+from geo_deep_learning.models.segmentation.segformer import SegFormerSegmentationModel
+from geo_deep_learning.tools.visualization import visualize_prediction
 from geo_deep_learning.utils.models import load_weights_from_checkpoint
 from geo_deep_learning.utils.tensors import denormalization
-from models.segmentation.segformer import SegFormerSegmentationModel
-from tools.visualization import visualize_prediction
 
 warnings.filterwarnings(
     "ignore",
diff --git a/geo_deep_learning/train.py b/geo_deep_learning/train.py
@@ -7,7 +7,7 @@
 from lightning.pytorch.cli import ArgsType, LightningCLI
 from lightning.pytorch.loggers import MLFlowLogger
 
-from configs import logging_config  # noqa: F401
+from geo_deep_learning.config import logging_config  # noqa: F401
 from geo_deep_learning.tools.mlflow_logger import LoggerSaveConfigCallback
 
 logger = logging.getLogger(__name__)
diff --git a/pyproject.toml b/pyproject.toml
@@ -4,39 +4,89 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "geo-deep-learning"
-version = "0.1.0a0"
-description = "Geospatial deep learning framework for segmentation tasks"
+version = "0.1.0"
+description = "Geospatial deep learning framework for geospatial tasks"
 readme = "README.md"
+requires-python = ">=3.12.0,<3.13"
 authors = [
   { name = "Victor Alhassan", email = "victor.alhassan@NRCan-RNCan.gc.ca" },
   { name = "Luca Romanini", email = "luca.romanini@NRCan-RNCan.gc.ca" },
 ]
-requires-python = ">=3.10"
 license = { file = "LICENSE" }
 classifiers = [
     "Development Status :: 3 - Alpha",
     "Intended Audience :: Science/Research",
     "License :: OSI Approved :: MIT License",
-    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.12",
     "Topic :: Scientific/Engineering :: Artificial Intelligence",
     "Topic :: Scientific/Engineering :: GIS",
 ]
 keywords = ["pytorch", "deep learning", "machine learning", "remote sensing", "satellite imagery", "earth observation", "geospatial"]
 
-# Dependencies are pulled from requirements.txt
-dynamic = ["dependencies"]
-
-[tool.setuptools.dynamic]
-dependencies = { file = ["requirements.txt"] }
+dependencies = [
+  "lightning>=2.0.0",
+  "torchmetrics>=1.0.0",
+  "kornia>=0.7.0",
+  "timm>=0.9.0",
+  "segmentation-models-pytorch>=0.3.3",
+  "webdataset>=0.2.0",
+  "torchgeo>=0.5.0",
+  "rasterio>=1.3.0",
+  "numpy>=1.24.0",
+  "pandas>=2.0.0",
+  "matplotlib>=3.7.0",
+  "mlflow>=2.0.0",
+  "colorlog>=6.7.0",
+  "PyYAML>=6.0",
+  "jsonargparse[all]>=4.27.7",
+  "jupyterlab>=4.0.0",
+  ]
 
 [project.optional-dependencies]
-dev = ["pytest", "ruff", "pre-commit"]
+cpu = ["torch>=2.7.0", "torchvision>=0.22.0",]
+cu128 = ["torch>=2.7.0", "torchvision>=0.22.0",]
+dev = ["pytest", "ruff", "pre-commit",]
 
 [project.urls]
 Homepage = "https://github.com/NRCan/geo-deep-learning"
 Repository = "https://github.com/NRCan/geo-deep-learning"
 Issues = "https://github.com/NRCan/geo-deep-learning/issues"
 
+[tool.setuptools.packages.find]
+include = ["geo_deep_learning*"]
+
+# --------------------------
+# UV configuration
+# --------------------------
+
+[tool.uv]
+conflicts = [
+  [
+    { extra = "cpu" },
+    { extra = "cu128" },
+  ],
+]
+
+[tool.uv.sources]
+torch = [
+  { index = "pytorch-cpu", extra = "cpu" },
+  { index = "pytorch-cu128", extra = "cu128" },
+]
+torchvision = [
+  { index = "pytorch-cpu", extra = "cpu" },
+  { index = "pytorch-cu128", extra = "cu128" },
+]
+
+[[tool.uv.index]]
+name = "pytorch-cpu"
+url = "https://download.pytorch.org/whl/cpu"
+explicit = true
+
+[[tool.uv.index]]
+name = "pytorch-cu128"
+url = "https://download.pytorch.org/whl/cu128"
+explicit = true
+
 
 # --------------------------
 # Ruff configuration
@@ -53,8 +103,9 @@ exclude = [
 src = ["geo_deep_learning"]
 line-length = 88
 indent-width = 4
-target-version = "py310"
+target-version = "py312"
 
+[tool.ruff.lint]
 # Enable full PEP 8 + modern checks
 select = ["ALL"]
 ignore = [
@@ -65,11 +116,8 @@ ignore = [
     "ERA001", # ignore commented out code
     "TC002", "TC003" # allow imports in type annotations without TYPE_CHECKING
 ]
-
-[tool.ruff.lint]
 fixable = ["ALL"]
 unfixable = []
-
 dummy-variable-rgx = "^(_+|(_+[a-zA-Z0-9_]*[a-zA-Z0-9]+?))$"
 
 [tool.ruff.format]
@@ -79,7 +127,6 @@ skip-magic-trailing-comma = false
 line-ending = "auto"
 
 [tool.ruff.lint.isort]
-# Treat both the package and legacy alias names as first-party
 known-first-party = [
   "geo_deep_learning",
   "tools",