Project-MONAI · mattlin1124 · Aug 3, 2025 · Aug 29, 2025 · coderabbitai · Aug 29, 2025
@@ -60,6 +60,7 @@ def sliding_window_inference(
     *args: Any,
     **kwargs: Any,
 ) -> torch.Tensor | tuple[torch.Tensor, ...] | dict[Any, torch.Tensor]:
+
     """
     Sliding window inference on `inputs` with `predictor`.
 
@@ -134,6 +135,14 @@ def sliding_window_inference(
         - input must be channel-first and have a batch dim, supports N-D sliding window.
 
     """
+
+    # auto transform (N,D,H,W,C) → (N,C,D,H,W)
+    if isinstance(inputs, torch.Tensor) and inputs.ndim == 5 and inputs.shape[-1] in (1, 3, 4):
+        inputs = inputs.permute(0, 4, 1, 2, 3).contiguous()
-    # auto transform (N,D,H,W,C) → (N,C,D,H,W)
-    if isinstance(inputs, torch.Tensor) and inputs.ndim == 5 and inputs.shape[-1] in (1, 3, 4):
-        inputs = inputs.permute(0, 4, 1, 2, 3).contiguous()
+    # Heuristic channel-last -> channel-first normalization with ambiguity guard.
+    if isinstance(inputs, torch.Tensor):
+        if inputs.ndim == 5:  # NDHWC or NCDHW
+            c2, cl = inputs.shape[1], inputs.shape[-1]
+            if cl in (1, 2, 3, 4) and c2 not in (1, 2, 3, 4):
+                inputs = inputs.permute(0, 4, 1, 2, 3).contiguous()
+            elif cl in (1, 2, 3, 4) and c2 in (1, 2, 3, 4) and cl != c2:
+                raise ValueError(
+                    f"Ambiguous channel dimension: dim=1 ({c2}) vs dim=-1 ({cl}). "
+                    "Please reorder explicitly to channel-first."
+                )
+        elif inputs.ndim == 4:  # NHWC or NCHW
+            c2, cl = inputs.shape[1], inputs.shape[-1]
+            if cl in (1, 2, 3, 4) and c2 not in (1, 2, 3, 4):
+                inputs = inputs.permute(0, 3, 1, 2).contiguous()
+            elif cl in (1, 2, 3, 4) and c2 in (1, 2, 3, 4) and cl != c2:
+                raise ValueError(
+                    f"Ambiguous channel dimension: dim=1 ({c2}) vs dim=-1 ({cl}). "
+                    "Please reorder explicitly to channel-first."
+                )
-    # auto transform (N,D,H,W,C) → (N,C,D,H,W)
-    if isinstance(inputs, torch.Tensor) and inputs.ndim == 5 and inputs.shape[-1] in (1, 3, 4):
-        inputs = inputs.permute(0, 4, 1, 2, 3).contiguous()
+    # Heuristic channel-last -> channel-first normalization with ambiguity guard.
+    if isinstance(inputs, torch.Tensor):
+        if inputs.ndim == 5:  # NDHWC or NCDHW
+            c2, cl = inputs.shape[1], inputs.shape[-1]
+            if cl in (1, 2, 3, 4) and c2 not in (1, 2, 3, 4):
+                inputs = inputs.permute(0, 4, 1, 2, 3).contiguous()
+            elif cl in (1, 2, 3, 4) and c2 in (1, 2, 3, 4) and cl != c2:
+                raise ValueError(
+                    f"Ambiguous channel dimension: dim=1 ({c2}) vs dim=-1 ({cl}). "
+                    "Please reorder explicitly to channel-first."
+                )
+        elif inputs.ndim == 4:  # NHWC or NCHW
+            c2, cl = inputs.shape[1], inputs.shape[-1]
+            if cl in (1, 2, 3, 4) and c2 not in (1, 2, 3, 4):
+                inputs = inputs.permute(0, 3, 1, 2).contiguous()
+            elif cl in (1, 2, 3, 4) and c2 in (1, 2, 3, 4) and cl != c2:
+                raise ValueError(
+                    f"Ambiguous channel dimension: dim=1 ({c2}) vs dim=-1 ({cl}). "
+                    "Please reorder explicitly to channel-first."
+                )
+
+
+
+
     buffered = buffer_steps is not None and buffer_steps > 0
     num_spatial_dims = len(inputs.shape) - 2
     if buffered:

@@ -134,6 +134,12 @@ def _compute_tensor(self, y_pred: torch.Tensor, y: torch.Tensor) -> torch.Tensor
         Raises:
             ValueError: when `y_pred` has fewer than three dimensions.
         """
+
+        if isinstance(y_pred, torch.Tensor) and y_pred.ndim == 5 and y_pred.shape[-1] in (1, 3, 4):
+            y_pred = y_pred.permute(0, 4, 1, 2, 3).contiguous()
+        if isinstance(y, torch.Tensor) and y.ndim == 5 and y.shape[-1] in (1, 3, 4):
+            y = y.permute(0, 4, 1, 2, 3).contiguous()
+
-        if isinstance(y_pred, torch.Tensor) and y_pred.ndim == 5 and y_pred.shape[-1] in (1, 3, 4):
-            y_pred = y_pred.permute(0, 4, 1, 2, 3).contiguous()
-        if isinstance(y, torch.Tensor) and y.ndim == 5 and y.shape[-1] in (1, 3, 4):
-            y = y.permute(0, 4, 1, 2, 3).contiguous()
+        # Normalize to channel-first; handle NHWC/NDHWC and fail fast on ambiguity.
+        def _norm(t: torch.Tensor, name: str) -> torch.Tensor:
+            """Return ``t`` in channel-first layout, permuting it when it looks channel-last.
+
+            Only 4-D and 5-D tensors are inspected; any other rank is returned
+            unchanged. The decision compares ``t.shape[1]`` with ``t.shape[-1]``.
+
+            Args:
+                t: tensor to normalize.
+                name: label prefixed to error messages (e.g. ``"y_pred"``).
+
+            Returns:
+                ``t`` itself when dim 1 is taken as the channel axis, otherwise a
+                contiguous tensor with the last axis moved to position 1.
+
+            Raises:
+                ValueError: with ``num_classes`` set, when neither axis equals
+                    ``num_classes`` or 1; without it, when both axes are small
+                    enough to be channel counts and the layout cannot be decided.
+            """
+            if t.ndim not in (4, 5):
+                return t
+            c2, cl = t.shape[1], t.shape[-1]
+            # num_classes is authoritative when provided
+            if self.num_classes is not None:
+                if c2 in (self.num_classes, 1):
+                    return t
+                if cl in (self.num_classes, 1):
+                    return t.permute(0, t.ndim - 1, *range(1, t.ndim - 1)).contiguous()
+                raise ValueError(
+                    f"{name}: cannot infer channel dimension with num_classes={self.num_classes}: "
+                    f"dim1={c2}, dim-1={cl}."
+                )
+            # A last axis larger than the largest channel count this heuristic
+            # recognises (4) is treated as spatial, so the tensor is left as
+            # channel-first. Without this guard an ordinary (N, C, H, W) input
+            # with C > 1 raised as "ambiguous", and (N, 1, H, W) was permuted.
+            # Channel-last inputs with more than 4 channels therefore need
+            # num_classes or explicit reordering by the caller.
+            if cl > 4:
+                return t
+            # Heuristic: prefer the side where channels > 1 and the other side == 1
+            if c2 > 1 and cl == 1:
+                return t  # NCHW[D]
+            if cl > 1 and c2 == 1:
+                return t.permute(0, t.ndim - 1, *range(1, t.ndim - 1)).contiguous()  # NHWC/NDHWC
+            # Ambiguous (both >1 or equal small values) -> fail fast
+            if (c2 > 1 and cl > 1) or (c2 == cl and c2 in (1, 2, 3, 4)):
+                raise ValueError(
+                    f"{name}: ambiguous channel dimension (dim1={c2}, dim-1={cl}). "
+                    "Set num_classes explicitly or reorder the inputs."
+                )
+            return t
+
+        y_pred = _norm(y_pred, "y_pred")
+        y      = _norm(y,      "y")
+        # Inconsistent forms require num_classes
+        if self.num_classes is None and ((y_pred.shape[1] == 1) ^ (y.shape[1] == 1)):
+            raise ValueError(
+                "Inconsistent inputs: label-map vs one-hot but num_classes is None. "
+                "Provide num_classes to disambiguate."
+            )
-        if isinstance(y_pred, torch.Tensor) and y_pred.ndim == 5 and y_pred.shape[-1] in (1, 3, 4):
-            y_pred = y_pred.permute(0, 4, 1, 2, 3).contiguous()
-        if isinstance(y, torch.Tensor) and y.ndim == 5 and y.shape[-1] in (1, 3, 4):
-            y = y.permute(0, 4, 1, 2, 3).contiguous()
+        # Normalize to channel-first; handle NHWC/NDHWC and fail fast on ambiguity.
+        def _norm(t: torch.Tensor, name: str) -> torch.Tensor:
+            """Return ``t`` in channel-first layout, permuting it when it looks channel-last.
+
+            Only 4-D and 5-D tensors are inspected; any other rank is returned
+            unchanged. The decision compares ``t.shape[1]`` with ``t.shape[-1]``.
+
+            Args:
+                t: tensor to normalize.
+                name: label prefixed to error messages (e.g. ``"y_pred"``).
+
+            Returns:
+                ``t`` itself when dim 1 is taken as the channel axis, otherwise a
+                contiguous tensor with the last axis moved to position 1.
+
+            Raises:
+                ValueError: with ``num_classes`` set, when neither axis equals
+                    ``num_classes`` or 1; without it, when both axes are small
+                    enough to be channel counts and the layout cannot be decided.
+            """
+            if t.ndim not in (4, 5):
+                return t
+            c2, cl = t.shape[1], t.shape[-1]
+            # num_classes is authoritative when provided
+            if self.num_classes is not None:
+                if c2 in (self.num_classes, 1):
+                    return t
+                if cl in (self.num_classes, 1):
+                    return t.permute(0, t.ndim - 1, *range(1, t.ndim - 1)).contiguous()
+                raise ValueError(
+                    f"{name}: cannot infer channel dimension with num_classes={self.num_classes}: "
+                    f"dim1={c2}, dim-1={cl}."
+                )
+            # A last axis larger than the largest channel count this heuristic
+            # recognises (4) is treated as spatial, so the tensor is left as
+            # channel-first. Without this guard an ordinary (N, C, H, W) input
+            # with C > 1 raised as "ambiguous", and (N, 1, H, W) was permuted.
+            # Channel-last inputs with more than 4 channels therefore need
+            # num_classes or explicit reordering by the caller.
+            if cl > 4:
+                return t
+            # Heuristic: prefer the side where channels > 1 and the other side == 1
+            if c2 > 1 and cl == 1:
+                return t  # NCHW[D]
+            if cl > 1 and c2 == 1:
+                return t.permute(0, t.ndim - 1, *range(1, t.ndim - 1)).contiguous()  # NHWC/NDHWC
+            # Ambiguous (both >1 or equal small values) -> fail fast
+            if (c2 > 1 and cl > 1) or (c2 == cl and c2 in (1, 2, 3, 4)):
+                raise ValueError(
+                    f"{name}: ambiguous channel dimension (dim1={c2}, dim-1={cl}). "
+                    "Set num_classes explicitly or reorder the inputs."
+                )
+            return t
+
+        y_pred = _norm(y_pred, "y_pred")
+        y      = _norm(y,      "y")
+        # Inconsistent forms require num_classes
+        if self.num_classes is None and ((y_pred.shape[1] == 1) ^ (y.shape[1] == 1)):
+            raise ValueError(
+                "Inconsistent inputs: label-map vs one-hot but num_classes is None. "
+                "Provide num_classes to disambiguate."
+            )
         dims = y_pred.ndimension()
         if dims < 3:
             raise ValueError(f"y_pred should have at least 3 dimensions (batch, channel, spatial), got {dims}.")