Project-MONAI · AlexanderSanin · May 18, 2026 · May 18, 2026 · coderabbitai · May 18, 2026
@@ -131,7 +131,7 @@ def filter(self, record):
     # workaround related to https://github.com/Project-MONAI/MONAI/issues/7575
     if hasattr(torch.cuda.device_count, "cache_clear"):
         torch.cuda.device_count.cache_clear()
-except BaseException:
+except Exception:
     from .utils.misc import MONAIEnvVars
 
     if MONAIEnvVars.debug():

@@ -341,7 +341,7 @@ def _get_all_case_stats(
                     _label_argmax = True  # track if label is argmaxed
                     batch_data[self.label_key] = label.to(device)
                 d = summarizer(batch_data)
-            except BaseException as err:
+            except Exception as err:
                 if "image_meta_dict" in batch_data.keys():
                     filename = batch_data["image_meta_dict"][ImageMetaKey.FILENAME_OR_OBJ]
                 else:
@@ -357,7 +357,7 @@ def _get_all_case_stats(
                                 label = torch.argmax(label, dim=0) if label.shape[0] > 1 else label[0]
                             batch_data[self.label_key] = label.to("cpu")
                         d = summarizer(batch_data)
-                    except BaseException as err:
+                    except Exception as err:
                         logger.info(f"Unable to process data {filename} on {device}. {err}")
                         continue
                 else:

@@ -216,7 +216,7 @@ def __call__(self, pred_param: dict | None = None) -> list:
             if "image_save_func" in param:
                 try:
                     ensemble_preds = self.ensemble_pred(preds, sigmoid=sigmoid)
-                except BaseException:
+                except Exception:
                     ensemble_preds = self.ensemble_pred([_.to("cpu") for _ in preds], sigmoid=sigmoid)
                 res = img_saver(ensemble_preds)
                 # res is the path to the saved results

@@ -59,7 +59,7 @@ def import_bundle_algo_history(
         if best_metric is None:
             try:
                 best_metric = algo.get_score()
-            except BaseException:
+            except Exception:
                 pass
 
         is_trained = best_metric is not None

@@ -541,7 +541,7 @@ def _compute_stats_single_threshold(
         for save_idx, array_index in enumerate(inds):
             precision[save_idx] = pr[array_index]
             th_scores[save_idx] = dt_scores_sorted[array_index]
-    except BaseException:
+    except Exception:
         pass
 
     return recall, np.array(precision), np.array(th_scores)
@@ -200,7 +200,7 @@ def __init__(
             from nnunetv2.utilities.dataset_name_id_conversion import maybe_convert_to_dataset_name
 
             self.dataset_name = maybe_convert_to_dataset_name(int(self.dataset_name_or_id))
-        except BaseException:
+        except Exception:
             logger.warning(
                 f"Dataset with name/ID: {self.dataset_name_or_id} cannot be found in the record. "
                 "Please ignore the message above if you are running the pipeline from a fresh start. "
@@ -278,7 +278,7 @@ def convert_dataset(self):
                 num_input_channels=num_input_channels,
                 output_datafolder=raw_data_foldername,
             )
-        except BaseException as err:
+        except Exception as err:
             logger.warning(f"Input config may be incorrect. Detail info: error/exception message is:\n {err}")
             return
 

@@ -120,7 +120,7 @@ def print_config(file=sys.stdout):
 def _dict_append(in_dict, key, fn):
     try:
         in_dict[key] = fn() if callable(fn) else fn
-    except BaseException:
+    except Exception:
         in_dict[key] = "UNKNOWN for given OS"
 
 

@@ -118,7 +118,7 @@
 from .wsi_datasets import MaskedPatchWSIDataset, PatchWSIDataset, SlidingPatchWSIDataset
 from .wsi_reader import BaseWSIReader, CuCIMWSIReader, OpenSlideWSIReader, TiffFileWSIReader, WSIReader
 
-with contextlib.suppress(BaseException):
+with contextlib.suppress(Exception):
     from multiprocessing.reduction import ForkingPickler
 
     def _rebuild_meta(cls, storage, dtype, metadata):

@@ -545,7 +545,7 @@ def __init__(
                 )
             if cache_roi_weight_map and self.roi_weight_map is None:
                 warnings.warn("cache_roi_weight_map=True, but cache is not created. (dynamic roi_size?)")
-        except BaseException as e:
+        except Exception as e:
             raise RuntimeError(
                 f"roi size {self.roi_size}, mode={mode}, sigma_scale={sigma_scale}, device={device}\n"
                 "Seems to be OOM. Please try smaller patch size or mode='constant' instead of mode='gaussian'."

@@ -162,6 +162,8 @@ def __init__(
         gamma: float = 0.5,
         delta: float = 0.7,
         reduction: LossReduction | str = LossReduction.MEAN,
+        use_softmax: bool = False,
+        use_sigmoid: bool = False,
     ):
         """
         Args:
@@ -170,8 +172,14 @@ def __init__(
             weight : weight for each loss function. Defaults to 0.5.
             gamma : value of the exponent gamma in the definition of the Focal loss. Defaults to 0.5.
             delta : weight of the background. Defaults to 0.7.
-
-
+            reduction: {``"none"``, ``"mean"``, ``"sum"``}
+                Specifies the reduction to apply to the output. Defaults to ``"mean"``.
+            use_softmax: if True, use softmax to transform the input logits into probabilities.
+                Defaults to False. Mutually exclusive with ``use_sigmoid``.
+            use_sigmoid: if True, use sigmoid to transform the input logits into probabilities.
+                Defaults to False. Mutually exclusive with ``use_softmax``.
+                When both ``use_softmax`` and ``use_sigmoid`` are False, the input is assumed
+                to already be probabilities.
 
         Example:
             >>> import torch
@@ -182,22 +190,25 @@ def __init__(
             >>> fl(pred, grnd)
         """
         super().__init__(reduction=LossReduction(reduction).value)
+        if use_softmax and use_sigmoid:
+            raise ValueError("use_softmax and use_sigmoid are mutually exclusive.")
         self.to_onehot_y = to_onehot_y
         self.num_classes = num_classes
         self.gamma = gamma
         self.delta = delta
         self.weight: float = weight
+        self.use_softmax = use_softmax
+        self.use_sigmoid = use_sigmoid
         self.asy_focal_loss = AsymmetricFocalLoss(gamma=self.gamma, delta=self.delta)
         self.asy_focal_tversky_loss = AsymmetricFocalTverskyLoss(gamma=self.gamma, delta=self.delta)
 
-    # TODO: Implement this  function to support multiple classes segmentation
     def forward(self, y_pred: torch.Tensor, y_true: torch.Tensor) -> torch.Tensor:
         """
         Args:
             y_pred : the shape should be BNH[WD], where N is the number of classes.
                 It only supports binary segmentation.
-                The input should be the original logits since it will be transformed by
-                    a sigmoid in the forward function.
+                The input can be raw logits or probabilities depending on ``use_softmax``
+                and ``use_sigmoid`` settings.
             y_true : the shape should be BNH[WD], where N is the number of classes.
                 It only supports binary segmentation.
 
@@ -227,6 +238,11 @@ def forward(self, y_pred: torch.Tensor, y_true: torch.Tensor) -> torch.Tensor:
             else:
                 y_true = one_hot(y_true, num_classes=n_pred_ch)
 
+        if self.use_softmax:
+            y_pred = torch.softmax(y_pred, dim=1)
+        elif self.use_sigmoid:
+            y_pred = torch.sigmoid(y_pred)
+
         asy_focal_loss = self.asy_focal_loss(y_pred, y_true)
         asy_focal_tversky_loss = self.asy_focal_tversky_loss(y_pred, y_true)
 

@@ -41,7 +41,7 @@ def has_ampere_or_later() -> bool:
             major, _ = pynvml.nvmlDeviceGetCudaComputeCapability(handle)
             if major >= 8:
                 return True
-    except BaseException:
+    except Exception:
         pass
     finally:
         pynvml.nvmlShutdown()
@@ -71,7 +71,7 @@ def detect_default_tf32() -> bool:
                 may_enable_tf32 = True
 
         return may_enable_tf32
-    except BaseException:
+    except Exception:
         from monai.utils.misc import MONAIEnvVars
 
         if MONAIEnvVars.debug():

@@ -140,7 +140,7 @@ def test_retina_shape(self, model, input_param, input_shape):
     def test_script(self, model, input_param, input_shape):
         try:
             idx = int(self.id().split("test_script_")[-1])
-        except BaseException:
+        except Exception:
             idx = 0
         idx %= 3
         # test whether support torchscript
@@ -174,7 +174,7 @@ def test_script(self, model, input_param, input_shape):
     def test_onnx(self, model, input_param, input_shape):
         try:
             idx = int(self.id().split("test_onnx_")[-1])
-        except BaseException:
+        except Exception:
             idx = 0
         idx %= 3
         # test whether support torchscript

@@ -61,6 +61,24 @@ def test_with_cuda(self):
         print(output)
         np.testing.assert_allclose(output.detach().cpu().numpy(), 0.0, atol=1e-4, rtol=1e-4)
 
+    def test_use_sigmoid(self):
+        loss = AsymmetricUnifiedFocalLoss(use_sigmoid=True)
+        y_pred = torch.tensor([[[[10.0, -10], [-10, 10.0]]], [[[10.0, -10], [-10, 10.0]]]])
+        y_true = torch.tensor([[[[1.0, 0], [0, 1.0]]], [[[1.0, 0], [0, 1.0]]]])
+        result = loss(y_pred, y_true)
+        self.assertTrue(result.item() >= 0)
+
+    def test_use_softmax(self):
+        loss = AsymmetricUnifiedFocalLoss(use_softmax=True)
+        y_pred = torch.tensor([[[[10.0, -10], [-10, 10.0]]], [[[10.0, -10], [-10, 10.0]]]])
+        y_true = torch.tensor([[[[1.0, 0], [0, 1.0]]], [[[1.0, 0], [0, 1.0]]]])
+        result = loss(y_pred, y_true)
+        self.assertTrue(result.item() >= 0)
+
+    def test_mutually_exclusive(self):
+        with self.assertRaises(ValueError):
+            AsymmetricUnifiedFocalLoss(use_softmax=True, use_sigmoid=True)
+
 
 if __name__ == "__main__":
     unittest.main()
@@ -249,7 +249,7 @@ def tearDown(self):
         if os.path.exists(self.tmp_ckpt_filename):
             try:
                 os.remove(self.tmp_ckpt_filename)
-            except BaseException:
+            except Exception:
                 pass
 
     @parameterized.expand(TEST_CASES)

@@ -241,7 +241,7 @@ def is_tf32_env():
                 a_full = torch.randn(1024, 1024, dtype=torch.double, device="cuda", generator=g_gpu)
                 b_full = torch.randn(1024, 1024, dtype=torch.double, device="cuda", generator=g_gpu)
                 _tf32_enabled = (a_full.float() @ b_full.float() - a_full @ b_full).abs().max().item() > 0.001  # 0.1713
-            except BaseException:
+            except Exception:
                 pass
         print(f"tf32 enabled: {_tf32_enabled}")
     return _tf32_enabled