PytorchConnectomics
diff --git a/connectomics/config/hydra_config.py b/connectomics/config/hydra_config.py
Lines changed: 29 additions & 7 deletions
diff --git a/connectomics/inference/tta.py b/connectomics/inference/tta.py
Lines changed: 112 additions & 5 deletions
diff --git a/connectomics/models/loss/build.py b/connectomics/models/loss/build.py
Lines changed: 3 additions & 1 deletion
diff --git a/connectomics/models/loss/losses.py b/connectomics/models/loss/losses.py
Lines changed: 36 additions & 1 deletion
@@ -107,6 +107,16 @@ class SystemConfig:
     print_auto_plan: bool = True  # Print auto-planning results
 
 
+@dataclass
+class LossBalancingConfig:
+    """Configuration for adaptive loss weighting.
+
+    Used as the ``loss_balancing`` field of ``ModelConfig``. The default
+    instance has ``strategy=None``.
+
+    NOTE(review): the code that consumes these values is not part of this
+    module; the per-field notes below that go beyond the listed allowed
+    values are assumptions to confirm against that consumer.
+    """
+
+    # Name of the balancing strategy. Presumably ``None`` means the static
+    # ``loss_weights`` are used unchanged -- TODO confirm.
+    strategy: Optional[str] = None  # None, "uncertainty", or "gradnorm"
+    # Presumably only read when strategy == "gradnorm"; looks like the
+    # GradNorm "alpha" hyperparameter -- TODO confirm.
+    gradnorm_alpha: float = 0.5
+    # Presumably a scale factor for the GradNorm auxiliary term -- TODO confirm.
+    gradnorm_lambda: float = 1.0
+    # Presumably selects which model parameters GradNorm measures gradient
+    # norms on -- TODO confirm.
+    gradnorm_parameter_strategy: str = "last"  # "first", "last", or "all"
+
+
 @dataclass
 class ModelConfig:
     """Model architecture configuration.
@@ -199,6 +209,7 @@ class ModelConfig:
     loss_functions: List[str] = field(default_factory=lambda: ["DiceLoss", "BCEWithLogitsLoss"])
     loss_weights: List[float] = field(default_factory=lambda: [1.0, 1.0])
     loss_kwargs: List[dict] = field(default_factory=lambda: [{}, {}])  # Per-loss kwargs
+    loss_balancing: LossBalancingConfig = field(default_factory=LossBalancingConfig)
 
     # Multi-task learning configuration
     # Defines which output channels correspond to which targets
@@ -881,11 +892,18 @@ class TestTimeAugmentationConfig:
     """Test-time augmentation configuration.
 
     Note: Saving predictions is now handled by SavePredictionConfig.
+
+    Axis Indexing:
+    - flip_axes: Uses full tensor indices (e.g., [2, 3] for H, W in 5D tensor (B, C, D, H, W))
+    - rotation90_axes: Uses spatial-only indices (e.g., [1, 2] for H-W plane where 0=D, 1=H, 2=W)
     """
 
     enabled: bool = False
     flip_axes: Any = (
-        None  # TTA flip strategy: "all" (8 flips), null (no aug), or list like [[0], [1], [2]]
+        None  # TTA flip strategy: "all" (8 flips), null (no aug), or list like [[2], [3]] (full tensor indices)
+    )
+    rotation90_axes: Any = (
+        None  # TTA rotation90 strategy: "all" (3 planes × 4 rotations), null, or list like [[1, 2]] (spatial indices: 0=D, 1=H, 2=W)
     )
     channel_activations: Optional[List[Any]] = (
         None  # Per-channel activations: [[start_ch, end_ch, 'activation'], ...] e.g., [[0, 2, 'softmax'], [2, 3, 'sigmoid'], [3, 4, 'tanh']]
@@ -1058,9 +1076,11 @@ class InferenceConfig:
 @dataclass
 class TestDataConfig:
     """Test data configuration."""
-    test_image: Optional[str] = None
-    test_label: Optional[str] = None
-    test_mask: Optional[str] = None
+    # These can be strings (single file), lists (multiple files), or None
+    # Using Any to support both str and List[str] (OmegaConf doesn't support Union of containers)
+    test_image: Any = None  # str, List[str], or None
+    test_label: Any = None  # str, List[str], or None
+    test_mask: Any = None  # str, List[str], or None
     test_resolution: Optional[List[float]] = None
     test_transpose: Optional[List[int]] = None
     output_path: Optional[str] = None
@@ -1080,9 +1100,11 @@ class TestConfig:
 @dataclass
 class TuneDataConfig:
     """Tuning data configuration."""
-    tune_image: Optional[str] = None
-    tune_label: Optional[str] = None
-    tune_mask: Optional[str] = None
+    # These can be strings (single file), lists (multiple files), or None
+    # Using Any to support both str and List[str] (OmegaConf doesn't support Union of containers)
+    tune_image: Any = None  # str, List[str], or None
+    tune_label: Any = None  # str, List[str], or None
+    tune_mask: Any = None  # str, List[str], or None
     tune_resolution: Optional[List[int]] = None
     # Image transformation (applied to tune images during inference)
     image_transform: ImageTransformConfig = field(default_factory=ImageTransformConfig)
 
@@ -13,6 +13,13 @@
 import torch
 from monai.transforms import Flip
 
+try:
+    from omegaconf import ListConfig
+    HAS_OMEGACONF = True
+except ImportError:
+    HAS_OMEGACONF = False
+    ListConfig = list  # Fallback
+
 
 class TTAPredictor:
     """Encapsulates TTA preprocessing and flip ensemble logic."""
@@ -126,7 +133,7 @@ def _sliding_window_predict(self, inputs: torch.Tensor) -> torch.Tensor:
 
     def predict(self, images: torch.Tensor, mask: Optional[torch.Tensor] = None) -> torch.Tensor:
         """
-        Perform test-time augmentation using flips and ensemble predictions.
+        Perform test-time augmentation using flips, rotations, and ensemble predictions.
 
         Args:
             images: Input volume (B, C, D, H, W) or (B, D, H, W) or (D, H, W)
@@ -153,17 +160,24 @@ def predict(self, images: torch.Tensor, mask: Optional[torch.Tensor] = None) ->
         if getattr(self.cfg.data, "do_2d", False) and images.size(2) == 1:
             images = images.squeeze(2)
 
+        # Get TTA configuration
         if hasattr(self.cfg, "inference") and hasattr(self.cfg.inference, "test_time_augmentation"):
             tta_flip_axes_config = getattr(
                 self.cfg.inference.test_time_augmentation, "flip_axes", None
             )
+            tta_rotation90_axes_config = getattr(
+                self.cfg.inference.test_time_augmentation, "rotation90_axes", None
+            )
         else:
             tta_flip_axes_config = None
+            tta_rotation90_axes_config = None
 
-        if tta_flip_axes_config is None:
+        # If no augmentation configured, run network once
+        if tta_flip_axes_config is None and tta_rotation90_axes_config is None:
             pred = self._run_network(images)
             ensemble_result = self.apply_preprocessing(pred)
         else:
+            # Parse flip axes configuration
             if tta_flip_axes_config == "all" or tta_flip_axes_config == []:
                 if images.dim() == 5:
                     spatial_axes = [1, 2, 3]
@@ -178,34 +192,127 @@ def predict(self, images: torch.Tensor, mask: Optional[torch.Tensor] = None) ->
 
                     for combo in combinations(spatial_axes, r):
                         tta_flip_axes.append(list(combo))
+            elif HAS_OMEGACONF and isinstance(tta_flip_axes_config, ListConfig):
+                # OmegaConf ListConfig - convert to regular list
+                tta_flip_axes_config = [
+                    list(item) if isinstance(item, ListConfig) else item
+                    for item in tta_flip_axes_config
+                ]
+                tta_flip_axes = [[]] + tta_flip_axes_config
             elif isinstance(tta_flip_axes_config, (list, tuple)):
                 tta_flip_axes = [[]] + list(tta_flip_axes_config)
+            elif tta_flip_axes_config is None:
+                tta_flip_axes = [[]]  # No flip augmentation
             else:
                 raise ValueError(
                     f"Invalid tta_flip_axes: {tta_flip_axes_config}. "
                     f"Expected 'all' (8 flips), null (no aug), or list of flip axes."
                 )
 
+            # Parse rotation90 axes configuration
+            # NOTE: We use torch.rot90 which expects full tensor axes
+            # For 5D tensor (B, C, D, H, W): D=2, H=3, W=4
+            # For 4D tensor (B, C, H, W): H=2, W=3
+            # Spatial axes from config (0=D, 1=H, 2=W) need to be converted
+            spatial_offset = 2  # Offset for batch and channel dimensions
+
+            if tta_rotation90_axes_config == "all":
+                if images.dim() == 5:
+                    # For 3D data (B, C, D, H, W), all possible rotation planes
+                    tta_rotation90_axes = [
+                        (2, 3),  # D-H plane
+                        (2, 4),  # D-W plane
+                        (3, 4),  # H-W plane
+                    ]
+                elif images.dim() == 4:
+                    # For 2D data (B, C, H, W), only one rotation plane
+                    tta_rotation90_axes = [(2, 3)]  # H-W plane
+                else:
+                    raise ValueError(f"Unsupported data dimensions: {images.dim()}")
+            elif HAS_OMEGACONF and isinstance(tta_rotation90_axes_config, ListConfig):
+                # OmegaConf ListConfig - convert to list and process
+                tta_rotation90_axes_config = list(tta_rotation90_axes_config)
+                if len(tta_rotation90_axes_config) > 0:
+                    tta_rotation90_axes = []
+                    for axes in tta_rotation90_axes_config:
+                        if HAS_OMEGACONF and isinstance(axes, ListConfig):
+                            axes = list(axes)
+                        if not isinstance(axes, (list, tuple)) or len(axes) != 2:
+                            raise ValueError(
+                                f"Invalid rotation plane: {axes}. Each plane must be a list/tuple of 2 axes."
+                            )
+                        # Convert spatial axes to full tensor axes
+                        full_axes = tuple(a + spatial_offset for a in axes)
+                        tta_rotation90_axes.append(full_axes)
+                else:
+                    tta_rotation90_axes = []
+            elif isinstance(tta_rotation90_axes_config, (list, tuple)) and len(tta_rotation90_axes_config) > 0:
+                # User-specified rotation planes: e.g., [[1, 2], [2, 3]]
+                # Validate that each entry is a list/tuple of length 2
+                tta_rotation90_axes = []
+                for axes in tta_rotation90_axes_config:
+                    if not isinstance(axes, (list, tuple)) or len(axes) != 2:
+                        raise ValueError(
+                            f"Invalid rotation plane: {axes}. Each plane must be a list/tuple of 2 axes."
+                        )
+                    # Convert spatial axes to full tensor axes
+                    full_axes = tuple(a + spatial_offset for a in axes)
+                    tta_rotation90_axes.append(full_axes)
+            elif tta_rotation90_axes_config is None:
+                tta_rotation90_axes = []  # No rotation augmentation
+            else:
+                raise ValueError(
+                    f"Invalid tta_rotation90_axes: {tta_rotation90_axes_config}. "
+                    f"Expected 'all', null (no rotation), or list of rotation planes like [[1, 2]]."
+                )
+
             ensemble_mode = getattr(
                 self.cfg.inference.test_time_augmentation, "ensemble_mode", "mean"
             )
 
             ensemble_result = None
             num_predictions = 0
 
+            # Generate all combinations of (flip_axes, rotation_plane, k_rotations)
+            # For each rotation plane, we try k=0,1,2,3 (0°, 90°, 180°, 270°)
+            augmentation_combinations = []
+
             for flip_axes in tta_flip_axes:
-                if flip_axes:
-                    x_aug = Flip(spatial_axis=flip_axes)(images)
+                if not tta_rotation90_axes:
+                    # No rotation: just add flip augmentation
+                    augmentation_combinations.append((flip_axes, None, 0))
                 else:
-                    x_aug = images
+                    # Add all rotation combinations for this flip
+                    for rotation_plane in tta_rotation90_axes:
+                        for k in range(4):  # 0, 1, 2, 3 rotations (0°, 90°, 180°, 270°)
+                            augmentation_combinations.append((flip_axes, rotation_plane, k))
 
+            # Apply each augmentation combination
+            for flip_axes, rotation_plane, k_rotations in augmentation_combinations:
+                x_aug = images
+
+                # Apply flip augmentation
+                if flip_axes:
+                    x_aug = Flip(spatial_axis=flip_axes)(x_aug)
+
+                # Apply rotation augmentation using torch.rot90
+                if rotation_plane is not None and k_rotations > 0:
+                    x_aug = torch.rot90(x_aug, k=k_rotations, dims=rotation_plane)
+
+                # Run network
                 pred = self._run_network(x_aug)
 
+                # Reverse rotation augmentation
+                if rotation_plane is not None and k_rotations > 0:
+                    pred = torch.rot90(pred, k=-k_rotations, dims=rotation_plane)
+
+                # Reverse flip augmentation
                 if flip_axes:
                     pred = Flip(spatial_axis=flip_axes)(pred)
 
                 pred_processed = self.apply_preprocessing(pred)
 
+                # Ensemble predictions
                 if ensemble_result is None:
                     ensemble_result = pred_processed.clone()
                 else:
 
@@ -28,6 +28,7 @@
     WeightedBCEWithLogitsLoss,
     WeightedMSELoss,
     WeightedMAELoss,
+    SmoothL1Loss,
     GANLoss,
 )
 
@@ -77,6 +78,7 @@ def create_loss(
         'CrossEntropyLoss': CrossEntropyLossWrapper,  # Use wrapper for shape handling
         'MSELoss': nn.MSELoss,
         'L1Loss': nn.L1Loss,
+        'SmoothL1Loss': SmoothL1Loss,
 
         # Custom connectomics losses
         'WeightedBCEWithLogitsLoss': WeightedBCEWithLogitsLoss,
@@ -320,4 +322,4 @@ def list_available_losses() -> List[str]:
     'create_multiclass_segmentation_loss',
     'create_focal_loss',
     'list_available_losses',
-]
+]
@@ -226,6 +226,41 @@ def forward(
             return mae
 
 
+class SmoothL1Loss(nn.Module):
+    """
+    Smooth L1 (Huber-like) loss with optional tanh activation and spatial weighting.
+
+    Useful for distance transform regression where large outliers should be
+    down-weighted relative to MSE.
+
+    Args:
+        beta: Forwarded unchanged to ``F.smooth_l1_loss`` as its ``beta``
+            argument (the threshold between the quadratic and linear regimes).
+        reduction: How the element-wise loss is reduced: ``'mean'``,
+            ``'sum'``, or ``'none'`` (return the element-wise loss tensor).
+        tanh: If True, ``torch.tanh`` is applied to ``pred`` before the loss
+            is computed.
+
+    Raises:
+        ValueError: If ``reduction`` is not ``'mean'``, ``'sum'`` or ``'none'``.
+    """
+
+    # Reductions understood by ``forward``; checked at construction time so a
+    # typo fails immediately instead of silently yielding an unreduced tensor.
+    _REDUCTIONS = ('mean', 'sum', 'none')
+
+    def __init__(self, beta: float = 1.0, reduction: str = 'mean', tanh: bool = False):
+        super().__init__()
+        if reduction not in self._REDUCTIONS:
+            raise ValueError(
+                f"Invalid reduction: {reduction!r}. "
+                f"Expected one of {self._REDUCTIONS}."
+            )
+        self.beta = beta
+        self.reduction = reduction
+        self.tanh = tanh
+
+    def forward(
+        self,
+        pred: torch.Tensor,
+        target: torch.Tensor,
+        weight: torch.Tensor = None,
+    ) -> torch.Tensor:
+        """
+        Compute the (optionally weighted) smooth L1 loss.
+
+        Args:
+            pred: Predictions; passed through ``tanh`` first when
+                ``self.tanh`` is True.
+            target: Regression targets, compared element-wise with ``pred``.
+            weight: Optional tensor multiplied into the element-wise loss
+                before reduction; must broadcast against that loss.
+                ``None`` disables weighting.
+
+        Returns:
+            A scalar tensor for ``'mean'``/``'sum'``, otherwise the
+            element-wise loss tensor.
+        """
+        if self.tanh:
+            pred = torch.tanh(pred)
+
+        # Always compute the element-wise loss so the weight map can be
+        # applied before any reduction takes place.
+        loss = F.smooth_l1_loss(pred, target, beta=self.beta, reduction='none')
+
+        if weight is not None:
+            loss = loss * weight
+
+        # NOTE: 'mean' averages over every element of the weighted loss; it
+        # is not normalized by the sum of the weights.
+        if self.reduction == 'mean':
+            return loss.mean()
+        if self.reduction == 'sum':
+            return loss.sum()
+        return loss
+
+
 class GANLoss(nn.Module):
     """
     GAN loss for adversarial training.
@@ -316,4 +351,4 @@ def forward(
     'WeightedMSELoss',
     'WeightedMAELoss',
     'GANLoss',
-]
+]