
Commit 6b19334

Grvzard authored and james77777778 committed
Introduce DTypePolicyMap
* Introduce `DTypePolicyMap`
* Fix `LayerNormalization.get_config` (keras-team#19807)
* Propagate kwargs through `keras.ops.isclose` (keras-team#19782): this allows
  passing `atol` and `rtol`; switched from `**kwargs` to explicit `rtol`,
  `atol`, and `equal_nan` arguments, implemented for all backends; the
  TensorFlow version now uses code inspired by `tf.experimental.numpy.isclose`
  instead of calling it directly; docs added for the new parameters.
* Faster `in_top_k` implementation for the JAX backend (keras-team#19814),
  including a fix for a bug in the rank computation.
* Fix CI
* Fix `TypeError` in `Lambda.from_config` (keras-team#19827)
* Fix `dmtree.is_nested()` and parameterize the tree test (keras-team#19822)
* Fix `keras.ops.repeat` not returning the expected shape when `x` is a
  `KerasTensor` and `axis` is `None` (keras-team#19826); test that a dynamic
  dimension stays dynamic after repetition; improve error messages.
* `Metric.variables` is now recursive (keras-team#19830). This allows it to
  surface variables from metrics nested at any depth. Previously, metrics
  within metrics within metrics would not have their variables tracked in JAX,
  causing them to never be updated.
* Fix `get_file` when the HTTP response has no `Content-Length` header
  (keras-team#19833)
* Add `ops.switch` (keras-team#19834): update tests, fix an out-of-bound index
  issue, and revert the use of `torch.cond`.
* Use `absl.testing.parameterized` for `tree_test.py` (keras-team#19842), for
  consistency with all other tests. It is one less dependency, and each test
  name now says `optree` or `dmtree`.
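The newly propagated tolerance arguments follow NumPy's closeness rule, `|x1 - x2| <= atol + rtol * |x2|`. A minimal NumPy illustration of what the new `rtol`, `atol`, and `equal_nan` parameters control (plain NumPy here, independent of the Keras op, using the same defaults the op exposes):

```python
import numpy as np

a = np.array([1.0, 1.0, float("nan")])
b = np.array([1.0 + 1e-6, 1.5, float("nan")])

# Defaults (rtol=1e-5, atol=1e-8): the 1e-6 gap is within tolerance.
print(np.isclose(a, b))                       # [ True False False]

# A tighter rtol with atol=0 rejects the same gap.
print(np.isclose(a, b, rtol=1e-8, atol=0.0))  # [False False False]

# NaNs compare equal only when explicitly requested.
print(np.isclose(a, b, equal_nan=True))       # [ True False  True]
```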
* Make the batch norm mask shape error more descriptive (keras-team#19829):
  the error message now includes shape information to help with debugging.
* Fix code style
* doc: `ops.slice` (keras-team#19843)
* Correct the example code in `unit_normalization.py` (keras-team#19845):
  added a missing closing bracket and the exact output value observed after
  replicating the code; adjust the code example.
* Add a `training` argument to `Model.compute_loss()` (keras-team#19840).
  This allows models to perform different computations during training and
  evaluation. For instance, metrics that are expensive to compute can be
  skipped during training and only computed during evaluation. Note that
  backwards compatibility with overrides that do not have the `training`
  argument is maintained.
* Fix the compatibility issues of `Orthogonal` and `GRU` (keras-team#19844):
  add the legacy `Orthogonal` class name and the legacy `implementation`
  argument to `GRU`.
* Fix inconsistent behavior of `losses.sparse_categorical_crossentropy` with
  and without `ignore_class` (keras-team#19838), with tests and formatting
  fixes.
* Fix bugs with the `Mean`, `Accuracy`, and `BinaryAccuracy` metrics
  (keras-team#19847):
  - `reduce_to_samplewise_values` would not reduce `sample_weight` correctly
    because the number of dimensions of `values` was checked instead.
  - `reduce_to_samplewise_values` needs to explicitly broadcast
    `sample_weight`. Before, it was implicitly broadcast in the multiplication
    with `values`; however, the explicit broadcast is needed for the
    computation of `num_samples` to make the averaging correct. The implicit
    version caused a bug whenever `sample_weight` had rank 2 or more and a
    broadcast happened during the multiplication. This logic existed in
    `tf_keras`:
    https://github.com/keras-team/tf-keras/blob/master/tf_keras/metrics/base_metric.py#L508
  - `Accuracy` and `BinaryAccuracy` were doing a mean reduction too early,
    before multiplying by `sample_weight`. This matters when the rank of
    `sample_weight` is the same as that of `y_true` and `y_pred`.
* `DTypePolicyMap` follow-ups: add tests, fix a test, update the
  `default_policy` logic, improve serialization, and improve `__repr__` and
  `__eq__`.
* Add `custom_gradient` for the numpy backend (keras-team#19849)
* Fix the variable name when adding in the init function (keras-team#19853)
* Address review comments; update docstrings.
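The `sample_weight` broadcasting fix can be illustrated with a schematic NumPy version of a weighted-mean reduction (this is not the actual Keras helper, just a sketch of why the explicit broadcast matters):

```python
import numpy as np

def weighted_mean(values, sample_weight):
    """Weighted mean with an explicit broadcast of `sample_weight`.

    If the broadcast stays implicit (only inside `values * sample_weight`),
    the normalizer `np.sum(sample_weight)` is computed on the unbroadcast
    weights and is too small whenever broadcasting duplicated weight entries.
    """
    sample_weight = np.broadcast_to(sample_weight, np.shape(values))
    total = np.sum(values * sample_weight)
    num_samples = np.sum(sample_weight)  # correct only after the broadcast
    return total / num_samples

values = np.array([[1.0, 3.0], [5.0, 7.0]])  # rank 2
weights = np.array([[1.0], [2.0]])           # rank 2, broadcast along axis 1
```

Here the broadcast weights are `[[1, 1], [2, 2]]`, so the normalizer is 6, not the 3 that the unbroadcast weights would give.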
1 parent 7a4eb67 commit 6b19334


53 files changed: +1240 −205 lines

keras/api/_tf_keras/keras/ops/__init__.py

Lines changed: 1 addition & 0 deletions
@@ -22,6 +22,7 @@
 from keras.src.ops.core import slice
 from keras.src.ops.core import slice_update
 from keras.src.ops.core import stop_gradient
+from keras.src.ops.core import switch
 from keras.src.ops.core import unstack
 from keras.src.ops.core import vectorized_map
 from keras.src.ops.core import while_loop

keras/api/ops/__init__.py

Lines changed: 1 addition & 0 deletions
@@ -22,6 +22,7 @@
 from keras.src.ops.core import slice
 from keras.src.ops.core import slice_update
 from keras.src.ops.core import stop_gradient
+from keras.src.ops.core import switch
 from keras.src.ops.core import unstack
 from keras.src.ops.core import vectorized_map
 from keras.src.ops.core import while_loop

keras/src/backend/jax/core.py

Lines changed: 4 additions & 0 deletions
@@ -287,6 +287,10 @@ def slice_update(inputs, start_indices, updates):
     return jax.lax.dynamic_update_slice(inputs, updates, start_indices)
 
 
+def switch(index, branches, *operands):
+    return jax.lax.switch(index, branches, *operands)
+
+
 def while_loop(
     cond,
     body,

keras/src/backend/jax/math.py

Lines changed: 5 additions & 5 deletions
@@ -40,11 +40,11 @@ def top_k(x, k, sorted=True):
 
 
 def in_top_k(targets, predictions, k):
-    targets = targets[..., None]
-    topk_values = top_k(predictions, k)[0]
-    targets_values = jnp.take_along_axis(predictions, targets, axis=-1)
-    mask = targets_values >= topk_values
-    return jnp.any(mask, axis=1)
+    preds_at_label = jnp.take_along_axis(
+        predictions, jnp.expand_dims(targets, axis=-1), axis=-1
+    )
+    rank = 1 + jnp.sum(jnp.greater(predictions, preds_at_label), axis=-1)
+    return jnp.less_equal(rank, k)
 
 
 def logsumexp(x, axis=None, keepdims=False):
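The rewritten JAX `in_top_k` avoids materializing the top-k values entirely: a label is in the top k if and only if fewer than k predictions strictly exceed the prediction at the label. A NumPy sketch of the same rank computation (illustrative only, mirroring the JAX code above):

```python
import numpy as np

def in_top_k(targets, predictions, k):
    # Prediction score at each sample's target label, shape (batch, 1).
    preds_at_label = np.take_along_axis(
        predictions, np.expand_dims(targets, axis=-1), axis=-1
    )
    # 1-based rank = 1 + number of strictly greater scores in the row.
    rank = 1 + np.sum(predictions > preds_at_label, axis=-1)
    return rank <= k

targets = np.array([0, 2])
predictions = np.array([[0.1, 0.9, 0.8], [0.05, 0.95, 0.7]])
```

Sample 0's label scores 0.1 and is beaten by two other scores (rank 3); sample 1's label scores 0.7 and is beaten by one (rank 2), so only the second is in the top 2.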

keras/src/backend/jax/numpy.py

Lines changed: 2 additions & 2 deletions
@@ -598,10 +598,10 @@ def imag(x):
     return jnp.imag(x)
 
 
-def isclose(x1, x2):
+def isclose(x1, x2, rtol=1e-5, atol=1e-8, equal_nan=False):
     x1 = convert_to_tensor(x1)
     x2 = convert_to_tensor(x2)
-    return jnp.isclose(x1, x2)
+    return jnp.isclose(x1, x2, rtol, atol, equal_nan)
 
 
 @sparse.densifying_unary

keras/src/backend/jax/trainer.py

Lines changed: 1 addition & 0 deletions
@@ -63,6 +63,7 @@ def compute_loss_and_updates(
             y=y,
             y_pred=y_pred,
             sample_weight=sample_weight,
+            training=training,
         )
         if losses:
             self._losses_override.clear()
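The commit message states that overrides of `compute_loss()` lacking the `training` argument keep working. One way such backward compatibility can be implemented, sketched here under the assumption of signature inspection (the actual Keras shim may differ; `call_compute_loss` is a hypothetical helper):

```python
import inspect

def call_compute_loss(compute_loss, **kwargs):
    """Drop `training` before calling overrides that do not accept it."""
    params = inspect.signature(compute_loss).parameters
    accepts_training = "training" in params or any(
        p.kind is inspect.Parameter.VAR_KEYWORD for p in params.values()
    )
    if not accepts_training:
        kwargs.pop("training", None)  # legacy override: silently discard
    return compute_loss(**kwargs)

def legacy_loss(y=None, y_pred=None):  # old-style override, no `training`
    return float(abs(y - y_pred))

def new_loss(y=None, y_pred=None, training=True):  # new-style override
    return 0.0 if training else float(abs(y - y_pred))
```

Both overrides can then be invoked uniformly with `training=...` in the keyword arguments.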

keras/src/backend/numpy/core.py

Lines changed: 26 additions & 4 deletions
@@ -1,3 +1,5 @@
+import warnings
+
 import numpy as np
 
 from keras.src import tree
@@ -241,6 +243,12 @@ def slice_update(inputs, start_indices, updates):
     return inputs
 
 
+def switch(index, branches, *operands):
+    index = convert_to_tensor(index, "int32")
+    index = np.clip(index, 0, len(branches) - 1)
+    return branches[index](*operands)
+
+
 def while_loop(
     cond,
     body,
@@ -279,7 +287,21 @@ def unstack(x, num=None, axis=0):
     return [x[i] for i in range(x.shape[0])]
 
 
-def custom_gradient(fun):
-    raise NotImplementedError(
-        "`custom_gradient` is not supported with numpy backend"
-    )
+class custom_gradient:
+    """Decorator for custom gradients.
+
+    Args:
+        fun: Forward pass function.
+    """
+
+    def __init__(self, fun):
+        warnings.warn(
+            "`custom_gradient` for the numpy backend acts as a pass-through to "
+            "support the forward pass. No gradient computation or modification "
+            "takes place."
+        )
+        self.fun = fun
+
+    def __call__(self, *args, **kwargs):
+        outputs, _ = self.fun(*args, **kwargs)
+        return outputs
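The numpy-backend `custom_gradient` now runs the forward pass and discards the gradient function instead of raising `NotImplementedError`. A self-contained replica of the decorator from the diff, with a toy decorated function:

```python
import warnings

class custom_gradient:
    """Pass-through decorator: keeps the forward pass, drops the grad fn."""

    def __init__(self, fun):
        warnings.warn(
            "`custom_gradient` for the numpy backend acts as a pass-through; "
            "no gradient computation or modification takes place."
        )
        self.fun = fun

    def __call__(self, *args, **kwargs):
        # `fun` returns (outputs, grad_fn); only the outputs survive.
        outputs, _ = self.fun(*args, **kwargs)
        return outputs

@custom_gradient
def square(x):
    # Forward value plus a gradient function that this backend ignores.
    return x * x, lambda upstream: 2 * x * upstream
```

Calling `square(3.0)` returns the forward value `9.0`; the custom gradient is simply never consulted on this backend.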

keras/src/backend/numpy/numpy.py

Lines changed: 4 additions & 2 deletions
@@ -65,6 +65,8 @@ def matmul(x1, x2):
         dtype = "int32"
     else:
         dtype = dtypes.result_type(x1.dtype, x2.dtype)
+    x1 = x1.astype(dtype)
+    x2 = x2.astype(dtype)
     return np.matmul(x1, x2).astype(dtype)
 
 
@@ -505,8 +507,8 @@ def imag(x):
     return np.imag(x)
 
 
-def isclose(x1, x2):
-    return np.isclose(x1, x2)
+def isclose(x1, x2, rtol=1e-5, atol=1e-8, equal_nan=False):
+    return np.isclose(x1, x2, rtol, atol, equal_nan)
 
 
 def isfinite(x):
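Casting the operands *before* `np.matmul` matters because casting only the result cannot undo overflow that already happened in a narrower dtype. A NumPy illustration of one failure mode this kind of pre-cast avoids (hypothetical values, not from the Keras tests):

```python
import numpy as np

x1 = np.array([[100]], dtype=np.int8)
x2 = np.array([[100]], dtype=np.int8)

# Cast only the result: the product is computed in int8 first,
# so 100 * 100 = 10000 has already wrapped around before the cast.
overflowed = np.matmul(x1, x2).astype("int32")

# Cast the operands first: the product is computed in int32.
correct = np.matmul(x1.astype("int32"), x2.astype("int32"))
```

The pre-cast version yields 10000; the post-cast version yields the wrapped int8 value instead.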

keras/src/backend/numpy/trainer.py

Lines changed: 2 additions & 2 deletions
@@ -28,8 +28,8 @@ def test_step(self, data):
             y_pred = self(x, training=False)
         else:
             y_pred = self(x)
-        loss = self.compute_loss(
-            x=x, y=y, y_pred=y_pred, sample_weight=sample_weight
+        loss = self._compute_loss(
+            x=x, y=y, y_pred=y_pred, sample_weight=sample_weight, training=False
         )
         self._loss_tracker.update_state(
             loss, sample_weight=tree.flatten(x)[0].shape[0]

keras/src/backend/tensorflow/core.py

Lines changed: 13 additions & 0 deletions
@@ -355,6 +355,19 @@ def slice_update(inputs, start_indices, updates):
     return dynamic_update_slice(inputs, updates, start_indices)
 
 
+def switch(index, branches, *operands):
+    index = convert_to_tensor(index, "int32")
+    index = tf.clip_by_value(index, 0, len(branches) - 1)
+
+    # Workaround to deal with python closures. More details:
+    # https://github.com/tensorflow/tensorflow/issues/8776#issuecomment-311383887
+    def gen_fn(i):
+        return lambda: branches[i](*operands)
+
+    branch_fns = [gen_fn(i) for i in range(len(branches))]
+    return tf.switch_case(index, branch_fns)
+
+
 def while_loop(
     cond,
     body,
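Across backends, `switch` clamps the index into the valid range and then calls the selected branch with `*operands`. A backend-agnostic pure-Python sketch of that contract (mirroring the numpy backend's clamping, without tensor conversion):

```python
def switch(index, branches, *operands):
    # Clamp out-of-range indices to [0, len(branches) - 1], as the
    # numpy and tensorflow backends above do.
    index = max(0, min(int(index), len(branches) - 1))
    return branches[index](*operands)

branches = [
    lambda x, y: x + y,  # branch 0
    lambda x, y: x - y,  # branch 1
]
```

For example, `switch(0, branches, 5, 2)` dispatches to the addition branch, while any index past the end (e.g. 42) is clamped to the last branch rather than raising.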
