Skip to content

Commit f3a8540

Browse files
authored
Merge branch 'keras-team:master' into master
2 parents d38ddca + 74fba84 commit f3a8540

File tree

31 files changed

+844
-230
lines changed

31 files changed

+844
-230
lines changed

keras/api/_tf_keras/keras/ops/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -215,6 +215,7 @@
215215
from keras.src.ops.numpy import kaiser as kaiser
216216
from keras.src.ops.numpy import kron as kron
217217
from keras.src.ops.numpy import lcm as lcm
218+
from keras.src.ops.numpy import ldexp as ldexp
218219
from keras.src.ops.numpy import left_shift as left_shift
219220
from keras.src.ops.numpy import less as less
220221
from keras.src.ops.numpy import less_equal as less_equal

keras/api/_tf_keras/keras/ops/numpy/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -101,6 +101,7 @@
101101
from keras.src.ops.numpy import kaiser as kaiser
102102
from keras.src.ops.numpy import kron as kron
103103
from keras.src.ops.numpy import lcm as lcm
104+
from keras.src.ops.numpy import ldexp as ldexp
104105
from keras.src.ops.numpy import left_shift as left_shift
105106
from keras.src.ops.numpy import less as less
106107
from keras.src.ops.numpy import less_equal as less_equal

keras/api/ops/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -215,6 +215,7 @@
215215
from keras.src.ops.numpy import kaiser as kaiser
216216
from keras.src.ops.numpy import kron as kron
217217
from keras.src.ops.numpy import lcm as lcm
218+
from keras.src.ops.numpy import ldexp as ldexp
218219
from keras.src.ops.numpy import left_shift as left_shift
219220
from keras.src.ops.numpy import less as less
220221
from keras.src.ops.numpy import less_equal as less_equal

keras/api/ops/numpy/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -101,6 +101,7 @@
101101
from keras.src.ops.numpy import kaiser as kaiser
102102
from keras.src.ops.numpy import kron as kron
103103
from keras.src.ops.numpy import lcm as lcm
104+
from keras.src.ops.numpy import ldexp as ldexp
104105
from keras.src.ops.numpy import left_shift as left_shift
105106
from keras.src.ops.numpy import less as less
106107
from keras.src.ops.numpy import less_equal as less_equal

keras/src/backend/common/backend_utils.py

Lines changed: 22 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -96,13 +96,13 @@ def _convert_conv_transpose_padding_args_from_keras_to_torch(
9696
)
9797

9898
if torch_output_padding >= stride:
99-
raise ValueError(
100-
f"The padding arguments (padding={padding}) and "
101-
f"output_padding={output_padding}) lead to a Torch "
102-
f"output_padding ({torch_output_padding}) that is greater than "
103-
f"strides ({stride}). This is not supported. You can change the "
104-
f"padding arguments, kernel or stride, or run on another backend. "
99+
warnings.warn(
100+
f"Torch backend requires output_padding < stride. "
101+
f"Clamping output_padding {torch_output_padding} -> {stride - 1} "
102+
f"for stride {stride}.",
103+
UserWarning,
105104
)
105+
torch_output_padding = stride - 1
106106

107107
return torch_padding, torch_output_padding
108108

@@ -184,6 +184,22 @@ def compute_conv_transpose_padding_args_for_torch(
184184
torch_paddings.append(torch_padding)
185185
torch_output_paddings.append(torch_output_padding)
186186

187+
# --- FIX FOR TORCH CONSTRAINT: output_padding < stride ---
188+
corrected_output_paddings = []
189+
for s, op in zip(
190+
strides
191+
if isinstance(strides, (list, tuple))
192+
else [strides] * num_spatial_dims,
193+
torch_output_paddings,
194+
):
195+
max_allowed = max(0, s - 1)
196+
if op > max_allowed:
197+
corrected_output_paddings.append(max_allowed)
198+
else:
199+
corrected_output_paddings.append(op)
200+
201+
torch_output_paddings = corrected_output_paddings
202+
187203
return torch_paddings, torch_output_paddings
188204

189205

keras/src/backend/common/backend_utils_test.py

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -170,6 +170,25 @@ def test_valid_padding_with_output_padding(self):
170170
self.assertEqual(torch_padding, 0)
171171
self.assertEqual(torch_output_padding, 1)
172172

173+
def test_output_padding_clamped_for_torch_constraint(self):
174+
"""Test that output_padding is clamped
175+
when >= stride (Torch constraint).
176+
"""
177+
(
178+
torch_paddings,
179+
torch_output_paddings,
180+
) = compute_conv_transpose_padding_args_for_torch(
181+
input_shape=(1, 8, 8, 8, 16), # any shape
182+
kernel_shape=(2, 2, 2, 16, 32), # Keras kernel shape
183+
strides=1,
184+
padding="same",
185+
output_padding=1, # Keras wants this
186+
dilation_rate=1,
187+
)
188+
# Torch expects output_padding < stride (1)
189+
# so output_padding should be clamped to 0
190+
self.assertEqual(torch_output_paddings, [0, 0, 0])
191+
173192

174193
class GetOutputShapeGivenTFPaddingTest(test_case.TestCase):
175194
def test_valid_padding_without_output_padding(self):

keras/src/backend/common/variables.py

Lines changed: 24 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -276,7 +276,7 @@ def value(self):
276276
return self._maybe_autocast(self._value)
277277

278278
def assign(self, value):
279-
value = self._convert_to_tensor(value, dtype=self.dtype)
279+
value = self._convert_to_tensor(value, dtype=self._dtype)
280280
if not shape_equal(value.shape, self.shape):
281281
raise ValueError(
282282
"The shape of the target variable and "
@@ -599,7 +599,6 @@ def standardize_shape(shape):
599599
# `tf.TensorShape` may contain `Dimension` objects.
600600
# We need to convert the items in it to either int or `None`
601601
shape = shape.as_list()
602-
shape = tuple(shape)
603602

604603
if config.backend() == "jax":
605604
# Replace `_DimExpr` (dimension expression) with None
@@ -609,25 +608,37 @@ def standardize_shape(shape):
609608
None if jax_export.is_symbolic_dim(d) else d for d in shape
610609
)
611610

612-
if config.backend() == "torch":
613-
# `shape` might be `torch.Size`. We need to convert the items in it to
614-
# either int or `None`
615-
shape = tuple(map(lambda x: int(x) if x is not None else None, shape))
616-
617-
for e in shape:
618-
if e is None:
611+
# Handle dimensions that are not ints and not None, verify they're >= 0.
612+
standardized_shape = []
613+
for d in shape:
614+
if d is None:
615+
standardized_shape.append(d)
619616
continue
620-
if not is_int_dtype(type(e)):
617+
618+
# Reject these even if they can be cast to int successfully.
619+
if isinstance(d, (str, float)):
621620
raise ValueError(
622621
f"Cannot convert '{shape}' to a shape. "
623-
f"Found invalid entry '{e}' of type '{type(e)}'. "
622+
f"Found invalid dimension '{d}' of type '{type(d)}'. "
624623
)
625-
if e < 0:
624+
625+
try:
626+
# Cast numpy scalars, tf constant tensors, etc.
627+
d = int(d)
628+
except Exception as e:
629+
raise ValueError(
630+
f"Cannot convert '{shape}' to a shape. "
631+
f"Found invalid dimension '{d}' of type '{type(d)}'. "
632+
) from e
633+
if d < 0:
626634
raise ValueError(
627635
f"Cannot convert '{shape}' to a shape. "
628636
"Negative dimensions are not allowed."
629637
)
630-
return shape
638+
standardized_shape.append(d)
639+
640+
# This also turns subclasses of `tuple` (e.g. `torch.Size`) to plain tuple.
641+
return tuple(standardized_shape)
631642

632643

633644
def shape_equal(a_shape, b_shape):

0 commit comments

Comments (0)