Fix(backend/torch): Resolve MPS broadcast crash in binary_crossentropy

Mithil27360 · Mithil27360 · commit dce518f393f3 · 2025-11-02T16:59:45.000+05:30
diff --git a/keras/src/backend/torch/nn.py b/keras/src/backend/torch/nn.py
@@ -755,12 +755,27 @@ def binary_crossentropy(target, output, from_logits=False):
     target = convert_to_tensor(target)
     output = convert_to_tensor(output)
 
+    # Fix for MPS broadcast error:
+    # The backward pass for BCELoss on MPS fails if inputs have a
+    # trailing dim of 1 (e.g., (B, T, 1) or (B, H, W, 1)).
+    # Squeezing to (B, T) or (B, H, W) resolves the conflict.
+    # .contiguous() copies only if the squeezed view is not already contiguous.
+    if (
+        target.ndim > 1
+        and output.ndim == target.ndim
+        and target.shape[-1] == 1
+        and output.shape[-1] == 1
+    ):
+        target = torch.squeeze(target, -1).contiguous()
+        output = torch.squeeze(output, -1).contiguous()
+
     if target.shape != output.shape:
         raise ValueError(
             "Arguments `target` and `output` must have the same shape. "
             "Received: "
             f"target.shape={target.shape}, output.shape={output.shape}"
         )
+
     # By default, PyTorch, does reduction of `sum` over all rows,
     # change reduction to `none` to keep dim
     if from_logits: