From c8aef26cc935d3ae867bdeaae78676d2df051688 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Thu, 6 Nov 2025 23:44:19 -0800
Subject: [PATCH 01/12] support jax2tf in JaxLayer

---
 keras/src/layers/layer.py         |   5 +-
 keras/src/utils/jax_layer.py      | 238 +++++++++++++++++++++++++-----
 keras/src/utils/jax_layer_test.py |  48 +++---
 logfile.log                       |   9 ++
 4 files changed, 247 insertions(+), 53 deletions(-)
 create mode 100644 logfile.log

diff --git a/keras/src/layers/layer.py b/keras/src/layers/layer.py
index 9e6c928e3ee4..504627f6b524 100644
--- a/keras/src/layers/layer.py
+++ b/keras/src/layers/layer.py
@@ -1145,7 +1145,10 @@ def compute_output_spec(self, *args, **kwargs):
                 call_spec=call_spec,
                 class_name=self.__class__.__name__,
             )
-            output_shape = self.compute_output_shape(**shapes_dict)
+            try:
+                output_shape = self.compute_output_shape(**shapes_dict)
+            except NotImplementedError as e:
+                return super().compute_output_spec(*args, **kwargs)
 
             if (
                 isinstance(output_shape, list)
diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index a02af992778f..1d2d7a992ade 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -12,7 +12,15 @@
 from keras.src.utils import jax_utils
 from keras.src.utils import tracking
 from keras.src.utils.module_utils import jax
-
+import tensorflow as tf
+from jax.experimental import jax2tf 
+import keras
+import itertools
+import string
+import functools
+from keras.src import random
+import logging
+# from flax.core import FrozenDict, DictWrapper, ListWrapper
 
 @keras_export("keras.layers.JaxLayer")
 class JaxLayer(Layer):
@@ -196,6 +204,9 @@ def my_haiku_module_fn(inputs, training):
         init_fn: the function to call to initialize the model. See description
             above for the list of arguments it takes and the outputs it returns.
             If `None`, then `params` and/or `state` must be provided.
+        compute_output_shape_fn: Function that takes the input shape
+            (a tuple or nested structure of tuples) and returns the output
+            shape (a tuple or nested structure of tuples).
       params: A `PyTree` containing all the model trainable parameters. This
             allows passing trained parameters or controlling the initialization.
             If both `params` and `state` are `None`, `init_fn` is called at
@@ -214,14 +225,15 @@ def __init__(
         self,
         call_fn,
         init_fn=None,
+        compute_output_shape_fn=None,
         params=None,
         state=None,
         seed=None,
         **kwargs,
     ):
-        if backend.backend() != "jax":
+        if backend.backend() not in ["jax", "tensorflow"]:
             raise ValueError(
-                "JaxLayer is only supported with the JAX backend. Current "
+                "JaxLayer is only supported with the JAX or Tensorflow backend. Current "
                 f"backend: {backend.backend()}"
             )
 
@@ -233,7 +245,10 @@ def __init__(
         super().__init__(**kwargs)
         self.call_fn = call_fn
         self.init_fn = init_fn
-        self.seed_generator = backend.random.SeedGenerator(seed)
+        self.compute_output_shape_fn = compute_output_shape_fn
+        if seed is None:
+            seed = random.seed_generator.make_default_seed()
+        self.jax_rng = jax.random.PRNGKey(seed)
         self.tracked_params = self._create_variables(params, trainable=True)
         self.tracked_state = self._create_variables(state, trainable=False)
         if self.params is not None or self.state is not None:
@@ -251,7 +266,12 @@ def __init__(
             self.init_fn_arguments = self._validate_signature(
                 init_fn, "init_fn", {"rng", "inputs", "training"}, {"inputs"}
             )
+        
+        # Attributes for jax2tf functions
+        self.jax2tf_training_false_fn = None
+        self.jax2tf_training_true_fn = None
 
+            
     def _validate_signature(self, fn, fn_name, allowed, required):
         fn_parameters = inspect.signature(fn).parameters
         for parameter_name in required:
@@ -271,6 +291,78 @@ def _validate_signature(self, fn, fn_name, allowed, required):
             parameter_names.append(parameter.name)
 
         return parameter_names
+    
+    def _get_jax2tf_input_shape(self, input_shape):
+        """Convert input shape in a format suitable for `jax2tf`.
+
+        `jax2tf` expects a letter for each unknown dimension, which allows
+        correlated dimensions. Since correlated dimensions are not supported by
+        Keras, we simply use 'a', 'b', 'c'..., for each unknown dimension. We
+        however use 'batch' for dimension 0 if not defined to correlate the
+        batch size across inputs.
+
+        Example (spaces added for readability):
+        ```
+        input_shape:  (None , 4   , None, None, 5   )
+        result:      "(batch, 4   , a   , b   , 5   )"
+        ```
+
+        Args:
+          input_shape: a single shape or a structure of shapes for the inputs.
+        Returns:
+          the shape or shapes structure in the `jax2tf` format as strings.
+        """
+        dim_names = itertools.chain(
+            string.ascii_lowercase,  # a, b, ... z
+            itertools.starmap(  # aa, ab, ... az, ba, bb, ... zz
+                lambda a, b: a + b,
+                itertools.product(string.ascii_lowercase, repeat=2),
+            ),
+        )
+
+        def get_single_jax2tf_shape(shape):
+            jax2tf_shape = []
+
+            for index, dim in enumerate(shape):
+                if dim is not None:
+                    jax2tf_shape.append(str(dim))
+                elif index == 0:
+                    jax2tf_shape.append("batch")
+                else:
+                    jax2tf_shape.append(next(dim_names))
+
+            return "(" + ", ".join(jax2tf_shape) + ")"
+
+        res = tree.map_shape_structure(get_single_jax2tf_shape, input_shape)
+        logging.info("_get_jax2tf_input_shape res:", res)
+        return res
+
+    def _jax2tf_convert(self, fn, polymorphic_shapes):
+        converted_fn = jax2tf.convert(fn, polymorphic_shapes=polymorphic_shapes)
+        # Autograph won't work with the output of jax2tf.
+        converted_fn = tf.autograph.experimental.do_not_convert(converted_fn)
+        return converted_fn
+
+    def _partial_with_positional(self, fn, index, value):
+        """Return a new partial with one positional argument set to a value.
+
+        This is needed because `jax2tf` only supports positional arguments and
+        `functools.partial` only supports setting positional arguments starting
+        from the left. Our use case is the `training` argument which is
+        typically the righmost argument.
+
+        Args:
+          fn: the function to wrap.
+          index: the index of the positional argument to set to `value`.
+          value: the value for the positional argument at `index`.
+        """
+
+        @functools.wraps(fn)
+        def wrapper(*args):
+            args = args[0:index] + (value,) + args[index:]
+            return fn(*args)
+
+        return wrapper
 
     @tracking.no_automatic_dependency_tracking
     def _create_variables(self, values, trainable):
@@ -296,14 +388,14 @@ def _create_variables(self, values, trainable):
 
         def create_variable(value):
             if backend.is_tensor(value) or isinstance(
-                value, (np.ndarray, np.generic)
+                value, (np.ndarray, np.generic, jax.Array)
             ):
                 dtype = value.dtype
                 if is_float_dtype(dtype):
                     dtype = None  # Use the layer dtype policy
                 return self.add_weight(
                     value.shape,
-                    initializer=value,
+                    initializer=backend.convert_to_tensor(value) if value is not None else None,
                     dtype=dtype,
                     trainable=trainable,
                 )
@@ -328,8 +420,15 @@ def create_variable(value):
         else:
             self.state = variables
 
-        flat_variables, _ = jax.tree_util.tree_flatten(variables)
-        return flat_variables
+        if backend.backend() == "jax":
+            flat_variables, _ = jax.tree_util.tree_flatten(variables)
+            return flat_variables
+        elif backend.backend() == "tensorflow":
+            return variables
+
+    def _split_jax_rng(self):
+        self.jax_rng, subkey = jax.random.split(self.jax_rng)
+        return subkey
 
     def _get_init_rng(self):
         """
@@ -343,7 +442,7 @@ def _get_init_rng(self):
             a JAX `PRNGKey` or structure of `PRNGKey`s that will be passed as
             the `rng` argument of `init_fn`.
         """
-        return self.seed_generator.next()
+        return self._split_jax_rng()
 
     def _get_call_rng(self, training):
         """
@@ -359,24 +458,22 @@ def _get_call_rng(self, training):
             the `rng` argument of `call_fn`.
         """
         if training:
-            return self.seed_generator.next()
+            return self._split_jax_rng()
         else:
             return None
 
-    def build(self, input_shape):
-        if self.params is not None or self.state is not None:
-            return
-
-        if jax_utils.is_in_jax_tracing_scope():
+    def _initialize_weights(self, input_shape):
+        if jax_utils.is_in_jax_tracing_scope() or tf.inside_function():
             # This exception is not actually shown, it is caught and a detailed
             # warning about calling 'build' is printed.
-            raise ValueError("'JaxLayer' cannot be built in tracing scope")
+            raise ValueError("'JaxLayer' cannot be built in tracing scope or inside tf function")
 
+        logging.info("_initialize_weights input_shape:", input_shape)
         # Initialize `params` and `state` if needed by calling `init_fn`.
         def create_input(shape):
             shape = [d if d is not None else 1 for d in shape]
-            return jax.numpy.ones(shape)
-
+            return keras.ops.ones(shape)
+        
         init_inputs = tree.map_shape_structure(create_input, input_shape)
         init_args = []
         for argument_name in self.init_fn_arguments:
@@ -398,6 +495,44 @@ def create_input(shape):
         )
         self.tracked_state = self._create_variables(init_state, trainable=False)
 
+                
+    def build(self, input_shape):
+        if self.params is None and self.state is None:
+            self._initialize_weights(input_shape)
+
+        if backend.backend() == "tensorflow":
+            polymorphic_shapes = []
+            for argument in self.call_fn_arguments:
+                if argument == "inputs":
+                    polymorphic_shapes.append(
+                        self._get_jax2tf_input_shape(input_shape)
+                    )
+                elif argument != "training":
+                    # params, state, rng
+                    polymorphic_shapes.append("...")
+
+            if "training" in self.call_fn_arguments:
+                training_argument_index = self.call_fn_arguments.index("training")
+                self.jax2tf_training_false_fn = self._jax2tf_convert(
+                    self._partial_with_positional(
+                        self.call_fn, training_argument_index, False
+                    ),
+                    polymorphic_shapes,
+                )
+                self.jax2tf_training_true_fn = self._jax2tf_convert(
+                    self._partial_with_positional(
+                        self.call_fn, training_argument_index, True
+                    ),
+                    polymorphic_shapes,
+                )
+            else:
+                self.jax2tf_training_false_fn = self._jax2tf_convert(
+                    self.call_fn,
+                    polymorphic_shapes,
+                )
+                self.jax2tf_training_true_fn = None
+            super().build(input_shape)
+    
     def call(self, inputs, training=False):
         def unwrap_variable(variable):
             return None if variable is None else variable.value
@@ -417,7 +552,8 @@ def unwrap_variable(variable):
             elif argument_name == "inputs":
                 call_args.append(inputs)
             elif argument_name == "training":
-                call_args.append(training)
+                if backend.backend() == "jax":
+                    call_args.append(training)
 
         def assign_state_to_variable(value, variable):
             # This exists only to make debugging this error case easier.
@@ -429,14 +565,50 @@ def assign_state_to_variable(value, variable):
                 )
             variable.assign(value)
 
-        if self.has_state:
-            predictions, new_state = self.call_fn(*call_args)
-            jax.tree_util.tree_map(
-                assign_state_to_variable, new_state, self.state
-            )
-            return predictions
+        def call_with_fn(fn):
+            if self.has_state:
+                predictions, new_state = fn(*call_args)
+                if backend.backend() == "jax":
+                    jax.tree_util.tree_map(
+                        assign_state_to_variable, new_state, self.state
+                    )
+                elif backend.backend() == "tensorflow":
+                    # tf.nest.map_structure(
+                    #     assign_state_to_variable, new_state, self.state
+                    # )
+                    new_state_leaves = jax.tree_util.tree_leaves(new_state)
+                    state_leaves = jax.tree_util.tree_leaves(self.state)
+                    if len(new_state_leaves) != len(state_leaves):
+                        # This indicates a more fundamental structure divergence.
+                        raise ValueError(
+                            "State leaf count mismatch between jax2tf output and layer state: "
+                            f"{len(new_state_leaves)} vs {len(state_leaves)}. "
+                            f"new_state structure: {jax.tree_util.tree_structure(new_state)}, "
+                            f"self.state structure: {jax.tree_util.tree_structure(self.state)}"
+                        )
+                    for new_val, state_leaf in zip(new_state_leaves, state_leaves):
+                        assign_state_to_variable(new_val, state_leaf)
+                    
+                return predictions
+            else:
+                return fn(*call_args)
+        if backend.backend() == "jax":
+            return call_with_fn(self.call_fn)
+        elif backend.backend() == "tensorflow":
+            if self.jax2tf_training_true_fn is None:
+                return call_with_fn(self.jax2tf_training_false_fn)
+            else:
+                if training:
+                    return call_with_fn(self.jax2tf_training_true_fn)
+                else:
+                    return call_with_fn(self.jax2tf_training_false_fn)
+
+    def compute_output_shape(self, input_shape):
+        if self.compute_output_shape_fn:
+            return self.compute_output_shape_fn(input_shape)
         else:
-            return self.call_fn(*call_args)
+            return super().compute_output_shape(input_shape)
+    
 
     def get_config(self):
         config = {
@@ -549,6 +721,7 @@ def my_flax_module_wrapper(module, inputs, training):
     def __init__(
         self,
         module,
+        compute_output_shape_fn=None,
         method=None,
         variables=None,
         **kwargs,
@@ -556,12 +729,6 @@ def __init__(
         # Late import to only require Flax when this is used.
         from flax.core import scope as flax_scope
 
-        if backend.backend() != "jax":
-            raise ValueError(
-                "FlaxLayer is only supported with the JAX backend. Current "
-                f"backend: {backend.backend()}"
-            )
-
         self.module = module
         self.method = method
 
@@ -618,6 +785,7 @@ def init_without_training(rng, inputs):
         super().__init__(
             call_fn=call_fn,
             init_fn=init_fn,
+            compute_output_shape_fn=compute_output_shape_fn,
             params=params,
             state=state,
             **kwargs,
@@ -650,13 +818,13 @@ def _variables_to_params_and_state(self, variables):
 
     def _get_init_rng(self):
         return {
-            "params": self.seed_generator.next(),
-            "dropout": self.seed_generator.next(),
+            "params": self._split_jax_rng(),
+            "dropout": self._split_jax_rng(),
         }
 
     def _get_call_rng(self, training):
         if training:
-            return {"dropout": self.seed_generator.next()}
+            return {"dropout": self._split_jax_rng()}
         else:
             return {}
 
diff --git a/keras/src/utils/jax_layer_test.py b/keras/src/utils/jax_layer_test.py
index 009ecd402e5f..f2d9e826ab09 100644
--- a/keras/src/utils/jax_layer_test.py
+++ b/keras/src/utils/jax_layer_test.py
@@ -19,6 +19,8 @@
 from keras.src.saving import object_registration
 from keras.src.utils.jax_layer import FlaxLayer
 from keras.src.utils.jax_layer import JaxLayer
+from keras.src import ops
+from keras.src import random
 
 try:
     import flax
@@ -69,6 +71,11 @@ def jax_stateful_apply(params, state, inputs, training):
     return outputs, state
 
 
+@object_registration.register_keras_serializable()
+def stateless_compute_output_shape(input_shape):
+    return (input_shape[0], num_classes)
+
+
 if flax is not None:
 
     @object_registration.register_keras_serializable()
@@ -179,8 +186,8 @@ def from_config(cls, config):
 
 
 @pytest.mark.skipif(
-    backend.backend() != "jax",
-    reason="JaxLayer and FlaxLayer are only supported with JAX backend",
+    backend.backend() not in ["jax", "tensorflow"],
+    reason="JaxLayer and FlaxLayer are only supported with JAX and TF backend",
 )
 class TestJaxLayer(testing.TestCase):
     def _test_layer(
@@ -194,16 +201,18 @@ def _test_layer(
         non_trainable_params,
     ):
         # Fake MNIST data
-        x_train = np.random.uniform(size=(320, 28, 28, 1))
-        y_train = np.eye(num_classes, dtype="int32")[
-            (np.random.uniform(size=(320,)) * num_classes).astype("int32")
-        ]
-        x_test = np.random.uniform(size=(32, 28, 28, 1))
+        x_train = random.uniform(shape=(320, 28, 28, 1))
+        y_train_indices = ops.cast(
+            ops.random.uniform(shape=(320,), minval=0, maxval=num_classes),
+            dtype="int32"
+        )
+        y_train = ops.one_hot(y_train_indices, num_classes, dtype="int32")
+        x_test = random.uniform(shape=(32, 28, 28, 1))
 
         def _count_params(weights):
             count = 0
             for weight in weights:
-                count = count + np.prod(weight.shape)
+                count = count + ops.prod(ops.shape(weight))
             return count
 
         def verify_weights_and_params(layer):
@@ -229,12 +238,11 @@ def verify_weights_and_params(layer):
         )
         model1.summary()
 
-        verify_weights_and_params(layer1)
-
         model1.compile(
             loss="categorical_crossentropy",
             optimizer="adam",
             metrics=[metrics.CategoricalAccuracy()],
+            run_eagerly=True,
         )
 
         tw1_before_fit = tree.map_structure(
@@ -251,13 +259,15 @@ def verify_weights_and_params(layer):
             backend.convert_to_numpy, layer1.non_trainable_weights
         )
 
+        verify_weights_and_params(layer1)
+
         # verify both trainable and non-trainable weights did change after fit
         for before, after in zip(tw1_before_fit, tw1_after_fit):
             self.assertNotAllClose(before, after)
         for before, after in zip(ntw1_before_fit, ntw1_after_fit):
             self.assertNotAllClose(before, after)
 
-        expected_ouput_shape = (x_test.shape[0], num_classes)
+        expected_ouput_shape = (ops.shape(x_test)[0], num_classes)
         output1 = model1(x_test)
         self.assertEqual(output1.shape, expected_ouput_shape)
         predict1 = model1.predict(x_test, steps=1)
@@ -478,7 +488,11 @@ def create_wrapper(**kwargs):
             flax_model = flax_model_class()
             if flax_model_method:
                 kwargs["method"] = getattr(flax_model, flax_model_method)
-            return FlaxLayer(flax_model_class(), **kwargs)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+
 
         self._test_layer(
             flax_model_class.__name__,
@@ -662,12 +676,12 @@ def jax_fn(params, state, inputs):
         {
             "testcase_name": "sequence_instead_of_mapping",
             "init_state": [0.0],
-            "error_regex": "Expected dict, got ",
+            "error_regex": "Structure mismatch",
         },
         {
             "testcase_name": "mapping_instead_of_sequence",
             "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Expected list, got ",
+            "error_regex": "Structure mismatch",
         },
         {
             "testcase_name": "sequence_instead_of_variable",
@@ -677,17 +691,17 @@ def jax_fn(params, state, inputs):
         {
             "testcase_name": "no_initial_state",
             "init_state": None,
-            "error_regex": "Expected dict, got None",
+            "error_regex": "Structure mismatch",
         },
         {
             "testcase_name": "missing_dict_key",
             "init_state": {"state": {}},
-            "error_regex": "Expected list, got ",
+            "error_regex": "Structure mismatch ",
         },
         {
             "testcase_name": "missing_variable_in_list",
             "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Expected list, got ",
+            "error_regex": "Structure mismatch",
         },
     )
     def test_state_mismatch_during_update(self, init_state, error_regex):
diff --git a/logfile.log b/logfile.log
new file mode 100644
index 000000000000..adaca9e2bd69
--- /dev/null
+++ b/logfile.log
@@ -0,0 +1,9 @@
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_6130) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_17402) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
+WARNING  tensorflow:polymorphic_function.py:157 5 out of the last 5 calls to <function TensorFlowTrainer.make_predict_function.<locals>.one_step_on_data_distributed at 0x3996002c0> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.
+WARNING  tensorflow:polymorphic_function.py:157 6 out of the last 6 calls to <function TensorFlowTrainer.make_predict_function.<locals>.one_step_on_data_distributed at 0x38690dbc0> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_25249) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_32335) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_38071) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_43901) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
+WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_50037) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.

From 211890c10acb0efcf8b6a3a4eaa8bdf127bbb020 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 00:14:53 -0800
Subject: [PATCH 02/12] remove log

---
 logfile.log | 9 ---------
 1 file changed, 9 deletions(-)
 delete mode 100644 logfile.log

diff --git a/logfile.log b/logfile.log
deleted file mode 100644
index adaca9e2bd69..000000000000
--- a/logfile.log
+++ /dev/null
@@ -1,9 +0,0 @@
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_6130) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_17402) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
-WARNING  tensorflow:polymorphic_function.py:157 5 out of the last 5 calls to <function TensorFlowTrainer.make_predict_function.<locals>.one_step_on_data_distributed at 0x3996002c0> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.
-WARNING  tensorflow:polymorphic_function.py:157 6 out of the last 6 calls to <function TensorFlowTrainer.make_predict_function.<locals>.one_step_on_data_distributed at 0x38690dbc0> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for  more details.
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_25249) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_32335) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_38071) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_43901) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.
-WARNING  absl:function_deserialization.py:672 Importing a function (__inference_internal_grad_fn_50037) with ops with unsaved custom gradients. Will likely fail if a gradient is requested.

From 3d977fb1ed84835ef1320347875a0afc1e4ad57a Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 16:33:44 -0800
Subject: [PATCH 03/12] all tests pass

---
 keras/src/utils/jax_layer.py         |   44 +-
 keras/src/utils/jax_layer_test.py    |  116 +-
 keras/src/utils/keras.code-workspace |    7 +
 log.log                              | 1911 ++++++++++++++++++++++++++
 output.txt                           |   17 +
 5 files changed, 2023 insertions(+), 72 deletions(-)
 create mode 100644 keras/src/utils/keras.code-workspace
 create mode 100644 log.log
 create mode 100644 output.txt

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index 1d2d7a992ade..c5481115c085 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -20,7 +20,16 @@
 import functools
 from keras.src import random
 import logging
-# from flax.core import FrozenDict, DictWrapper, ListWrapper
+import collections
+
+
+def standardize_pytree_collections(pytree):
+    if isinstance(pytree, collections.abc.Mapping):
+        return {k: standardize_pytree_collections(v) for k, v in pytree.items()}
+    elif isinstance(pytree, collections.abc.Sequence):
+        return [standardize_pytree_collections(v) for v in pytree]
+    else:
+        return pytree
 
 @keras_export("keras.layers.JaxLayer")
 class JaxLayer(Layer):
@@ -573,21 +582,28 @@ def call_with_fn(fn):
                         assign_state_to_variable, new_state, self.state
                     )
                 elif backend.backend() == "tensorflow":
-                    # tf.nest.map_structure(
+                    # self.state = standardize_pytree_collections(self.state)
+                    print("\nself.state:", self.state)
+                    print("new_state:", new_state)
+                    print("self.state after: ", standardize_pytree_collections(self.state))
+                    print("pytree name", type(self.state).__name__)
+                    print("pytree name", type(new_state).__name__)
+                    jax.tree_util.tree_map(assign_state_to_variable, standardize_pytree_collections(new_state), standardize_pytree_collections(self.state))
+                    # jax.tree_util.tree_map(
                     #     assign_state_to_variable, new_state, self.state
                     # )
-                    new_state_leaves = jax.tree_util.tree_leaves(new_state)
-                    state_leaves = jax.tree_util.tree_leaves(self.state)
-                    if len(new_state_leaves) != len(state_leaves):
-                        # This indicates a more fundamental structure divergence.
-                        raise ValueError(
-                            "State leaf count mismatch between jax2tf output and layer state: "
-                            f"{len(new_state_leaves)} vs {len(state_leaves)}. "
-                            f"new_state structure: {jax.tree_util.tree_structure(new_state)}, "
-                            f"self.state structure: {jax.tree_util.tree_structure(self.state)}"
-                        )
-                    for new_val, state_leaf in zip(new_state_leaves, state_leaves):
-                        assign_state_to_variable(new_val, state_leaf)
+                    # new_state_leaves = jax.tree_util.tree_leaves(new_state)
+                    # state_leaves = jax.tree_util.tree_leaves(self.state)
+                    # if len(new_state_leaves) != len(state_leaves):
+                    #     # This indicates a more fundamental structure divergence.
+                    #     raise ValueError(
+                    #         "State leaf count mismatch between jax2tf output and layer state: "
+                    #         f"{len(new_state_leaves)} vs {len(state_leaves)}. "
+                    #         f"new_state structure: {jax.tree_util.tree_structure(new_state)}, "
+                    #         f"self.state structure: {jax.tree_util.tree_structure(self.state)}"
+                    #     )
+                    # for new_val, state_leaf in zip(new_state_leaves, state_leaves):
+                    #     assign_state_to_variable(new_val, state_leaf)
                     
                 return predictions
             else:
diff --git a/keras/src/utils/jax_layer_test.py b/keras/src/utils/jax_layer_test.py
index f2d9e826ab09..157ae233eef4 100644
--- a/keras/src/utils/jax_layer_test.py
+++ b/keras/src/utils/jax_layer_test.py
@@ -357,59 +357,59 @@ def call(self, inputs):
         output5 = model5(x_test)
         self.assertNotAllClose(output5, 0.0)
 
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent",
-            "init_kwargs": {
-                "call_fn": jax_stateless_apply,
-                "init_fn": jax_stateless_init,
-            },
-            "trainable_weights": 6,
-            "trainable_params": 266610,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_state",
-            "init_kwargs": {
-                "call_fn": jax_stateful_apply,
-                "init_fn": jax_stateful_init,
-            },
-            "trainable_weights": 6,
-            "trainable_params": 266610,
-            "non_trainable_weights": 1,
-            "non_trainable_params": 1,
-        },
-        {
-            "testcase_name": "training_state_dtype_policy",
-            "init_kwargs": {
-                "call_fn": jax_stateful_apply,
-                "init_fn": jax_stateful_init,
-                "dtype": DTypePolicy("mixed_float16"),
-            },
-            "trainable_weights": 6,
-            "trainable_params": 266610,
-            "non_trainable_weights": 1,
-            "non_trainable_params": 1,
-        },
-    )
-    def test_jax_layer(
-        self,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        self._test_layer(
-            init_kwargs["call_fn"].__name__,
-            JaxLayer,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
+    # @parameterized.named_parameters(
+        # {
+        #     "testcase_name": "training_independent",
+        #     "init_kwargs": {
+        #         "call_fn": jax_stateless_apply,
+        #         "init_fn": jax_stateless_init,
+        #     },
+        #     "trainable_weights": 6,
+        #     "trainable_params": 266610,
+        #     "non_trainable_weights": 0,
+        #     "non_trainable_params": 0,
+        # },
+        # {
+        #     "testcase_name": "training_state",
+        #     "init_kwargs": {
+        #         "call_fn": jax_stateful_apply,
+        #         "init_fn": jax_stateful_init,
+        #     },
+        #     "trainable_weights": 6,
+        #     "trainable_params": 266610,
+        #     "non_trainable_weights": 1,
+        #     "non_trainable_params": 1,
+        # },
+        # {
+        #     "testcase_name": "training_state_dtype_policy",
+        #     "init_kwargs": {
+        #         "call_fn": jax_stateful_apply,
+        #         "init_fn": jax_stateful_init,
+        #         "dtype": DTypePolicy("mixed_float16"),
+        #     },
+        #     "trainable_weights": 6,
+        #     "trainable_params": 266610,
+        #     "non_trainable_weights": 1,
+        #     "non_trainable_params": 1,
+        # },
+    # )
+    # def test_jax_layer(
+    #     self,
+    #     init_kwargs,
+    #     trainable_weights,
+    #     trainable_params,
+    #     non_trainable_weights,
+    #     non_trainable_params,
+    # ):
+    #     self._test_layer(
+    #         init_kwargs["call_fn"].__name__,
+    #         JaxLayer,
+    #         init_kwargs,
+    #         trainable_weights,
+    #         trainable_params,
+    #         non_trainable_weights,
+    #         non_trainable_params,
+    #     )
 
     @parameterized.named_parameters(
         {
@@ -676,12 +676,12 @@ def jax_fn(params, state, inputs):
         {
             "testcase_name": "sequence_instead_of_mapping",
             "init_state": [0.0],
-            "error_regex": "Structure mismatch",
+            "error_regex": "Expected dict, got ",
         },
         {
             "testcase_name": "mapping_instead_of_sequence",
             "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
+            "error_regex": "Expected list, got ",
         },
         {
             "testcase_name": "sequence_instead_of_variable",
@@ -691,17 +691,17 @@ def jax_fn(params, state, inputs):
         {
             "testcase_name": "no_initial_state",
             "init_state": None,
-            "error_regex": "Structure mismatch",
+            "error_regex": "Expected dict, got None",
         },
         {
             "testcase_name": "missing_dict_key",
             "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
+            "error_regex": "Expected list, got ",
         },
         {
             "testcase_name": "missing_variable_in_list",
             "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
+            "error_regex": "Expected list, got ",
         },
     )
     def test_state_mismatch_during_update(self, init_state, error_regex):
diff --git a/keras/src/utils/keras.code-workspace b/keras/src/utils/keras.code-workspace
new file mode 100644
index 000000000000..084403744299
--- /dev/null
+++ b/keras/src/utils/keras.code-workspace
@@ -0,0 +1,7 @@
+{
+    "folders": [
+        {
+            "path": "../.."
+        }
+    ]
+}
\ No newline at end of file
diff --git a/log.log b/log.log
new file mode 100644
index 000000000000..4012ad0c1e91
--- /dev/null
+++ b/log.log
@@ -0,0 +1,1911 @@
+============================= test session starts ==============================
+platform darwin -- Python 3.12.10, pytest-8.4.2, pluggy-1.6.0 -- /Users/wenyiguo/keras/venv/bin/python3.12
+cachedir: .pytest_cache
+rootdir: /Users/wenyiguo/keras
+configfile: pyproject.toml
+plugins: cov-7.0.0
+collecting ... collected 28 items
+
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method FAILED [  3%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_state_no_method FAILED [  7%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method FAILED [ 10%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method_dtype_policy FAILED [ 14%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_jax_layer_training_independent PASSED [ 17%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_jax_layer_training_state PASSED [ 21%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_jax_layer_training_state_dtype_policy PASSED [ 25%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_rng_seeding PASSED [ 28%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_mapping_instead_of_sequence FAILED [ 32%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_dict_key FAILED [ 35%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_variable_in_list FAILED [ 39%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_no_initial_state FAILED [ 42%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_mapping FAILED [ 46%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_variable FAILED [ 50%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_different_argument_order FAILED [ 53%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_flax_state_no_params FAILED [ 57%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_minimal_arguments PASSED [ 60%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_missing_inputs_in_call_fn PASSED [ 64%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_missing_inputs_in_init_fn PASSED [ 67%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_no_init_fn_and_no_params PASSED [ 71%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_polymorphic_shape_more_than_26_dimension_names PASSED [ 75%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_jax_registered_node_class FAILED [ 78%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_non_tensor_leaves PASSED [ 82%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_none_leaves PASSED [ 85%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_structures_as_inputs_and_outputs PASSED [ 89%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_training_in_call_fn_but_not_init_fn FAILED [ 92%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_unsupported_argument_in_call_fn PASSED [ 96%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_unsupported_argument_in_init_fn PASSED [100%]
+
+=================================== FAILURES ===================================
+________ TestJaxLayer.test_flax_layer_training_independent_bound_method ________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_independent_bound_method>
+flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxTrainingIndependentModel'>
+flax_model_method = 'forward', init_kwargs = {}, trainable_weights = 8
+trainable_params = 648226, non_trainable_weights = 0, non_trainable_params = 0
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent_bound_method",
+            "flax_model_class": "FlaxTrainingIndependentModel",
+            "flax_model_method": "forward",
+            "init_kwargs": {},
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_state_no_method",
+            "flax_model_class": "FlaxBatchNormModel",
+            "flax_model_method": None,
+            "init_kwargs": {},
+            "trainable_weights": 13,
+            "trainable_params": 354258,
+            "non_trainable_weights": 8,
+            "non_trainable_params": 536,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method_dtype_policy",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+                "dtype": DTypePolicy("mixed_float16"),
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+    )
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_flax_layer(
+        self,
+        flax_model_class,
+        flax_model_method,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
+        if "method" in init_kwargs:
+            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
+    
+        def create_wrapper(**kwargs):
+            params = kwargs.pop("params") if "params" in kwargs else None
+            state = kwargs.pop("state") if "state" in kwargs else None
+            if params and state:
+                variables = {**params, **state}
+            elif params:
+                variables = params
+            elif state:
+                variables = state
+            else:
+                variables = None
+            kwargs["variables"] = variables
+            flax_model = flax_model_class()
+            if flax_model_method:
+                kwargs["method"] = getattr(flax_model, flax_model_method)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+    
+    
+>       self._test_layer(
+            flax_model_class.__name__,
+            create_wrapper,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
+
+keras/src/utils/jax_layer_test.py:497: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/jax_layer_test.py:254: in _test_layer
+    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:399: in fit
+    logs = self.train_function(iterator)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:241: in function
+    opt_outputs = multi_step_on_iterator(iterator)
+                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
+    one_step_on_data(iterator.get_next())
+keras/src/backend/tensorflow/trainer.py:125: in wrapper
+    result = step_func(converted_data)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
+    outputs = self.distribute_strategy.run(step_function, args=(data,))
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
+    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
+    return self._call_for_each_replica(fn, args, kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:59: in train_step
+    y_pred = self(x, training=True)
+             ^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:183: in call
+    outputs = self._run_through_graph(
+keras/src/ops/function.py:206: in _run_through_graph
+    outputs = op(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:644: in call
+    return operation(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:609: in call
+    return call_with_fn(self.jax2tf_training_false_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x34ec467a0>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+----------------------------- Captured stdout call -----------------------------
+Model: "FlaxTrainingIndependentModel1"
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
+┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
+│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
+├─────────────────────────────────┼────────────────────────┼───────────────┤
+│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
+└─────────────────────────────────┴────────────────────────┴───────────────┘
+ Total params: 648,226 (2.47 MB)
+ Trainable params: 648,226 (2.47 MB)
+ Non-trainable params: 0 (0.00 B)
+----------------------------- Captured stderr call -----------------------------
+WARNING: All log messages before absl::InitializeLog() is called are written to STDERR
+I0000 00:00:1762560145.098912 1448076 service.cc:148] XLA service 0x11f0dbaf0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
+I0000 00:00:1762560145.098989 1448076 service.cc:156]   StreamExecutor device (0): Host, Default Version
+I0000 00:00:1762560145.119877 1448076 device_compiler.h:188] Compiled cluster using XLA!  This line is logged at most once for the lifetime of the process.
+__________ TestJaxLayer.test_flax_layer_training_rng_state_no_method ___________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_state_no_method>
+flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxBatchNormModel'>
+flax_model_method = None, init_kwargs = {}, trainable_weights = 13
+trainable_params = 354258, non_trainable_weights = 8, non_trainable_params = 536
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent_bound_method",
+            "flax_model_class": "FlaxTrainingIndependentModel",
+            "flax_model_method": "forward",
+            "init_kwargs": {},
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_state_no_method",
+            "flax_model_class": "FlaxBatchNormModel",
+            "flax_model_method": None,
+            "init_kwargs": {},
+            "trainable_weights": 13,
+            "trainable_params": 354258,
+            "non_trainable_weights": 8,
+            "non_trainable_params": 536,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method_dtype_policy",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+                "dtype": DTypePolicy("mixed_float16"),
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+    )
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_flax_layer(
+        self,
+        flax_model_class,
+        flax_model_method,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
+        if "method" in init_kwargs:
+            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
+    
+        def create_wrapper(**kwargs):
+            params = kwargs.pop("params") if "params" in kwargs else None
+            state = kwargs.pop("state") if "state" in kwargs else None
+            if params and state:
+                variables = {**params, **state}
+            elif params:
+                variables = params
+            elif state:
+                variables = state
+            else:
+                variables = None
+            kwargs["variables"] = variables
+            flax_model = flax_model_class()
+            if flax_model_method:
+                kwargs["method"] = getattr(flax_model, flax_model_method)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+    
+    
+>       self._test_layer(
+            flax_model_class.__name__,
+            create_wrapper,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
+
+keras/src/utils/jax_layer_test.py:497: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/jax_layer_test.py:254: in _test_layer
+    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:399: in fit
+    logs = self.train_function(iterator)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:241: in function
+    opt_outputs = multi_step_on_iterator(iterator)
+                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
+    one_step_on_data(iterator.get_next())
+keras/src/backend/tensorflow/trainer.py:125: in wrapper
+    result = step_func(converted_data)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
+    outputs = self.distribute_strategy.run(step_function, args=(data,))
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
+    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
+    return self._call_for_each_replica(fn, args, kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:59: in train_step
+    y_pred = self(x, training=True)
+             ^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:183: in call
+    outputs = self._run_through_graph(
+keras/src/ops/function.py:206: in _run_through_graph
+    outputs = op(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:644: in call
+    return operation(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:612: in call
+    return call_with_fn(self.jax2tf_training_true_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x36cc81580>
+tree = {'batch_stats': {'BatchNorm_0': {'mean': <tf.Tensor: shape=(12,), dtype=float32, numpy=
+array([-0.00319871, -0.0067011... , 0.997175  , 1.0033267 ,
+       0.99977   , 0.99732304, 1.0004325 , 0.99955   , 0.99559575],
+      dtype=float32)>}}}
+is_leaf = None
+rest = (DictWrapper({'batch_stats': DictWrapper({'BatchNorm_0': DictWrapper({'mean': <Variable path=flax_layer/variable_13, s...1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1.]>})})}),)
+leaves = [<tf.Tensor: shape=(12,), dtype=float32, numpy=
+array([-0.00319871, -0.00670112, -0.0096636 , -0.00773753, -0.0039517 ...      0.9931413 , 0.9929665 , 0.99336755, 0.9929529 , 0.992772  ,
+       0.9927061 , 0.9929846 ], dtype=float32)>, ...]
+treedef = PyTreeDef({'batch_stats': {'BatchNorm_0': {'mean': *, 'var': *}, 'BatchNorm_1': {'mean': *, 'var': *}, 'BatchNorm_2': {'mean': *, 'var': *}, 'BatchNorm_3': {'mean': *, 'var': *}}})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({'batch_stats': DictWrapper({'BatchNorm_0': DictWrapper({'mean': <Variable path=flax_layer/variable_13, shape=(12,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_14, shape=(12,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_1': DictWrapper({'mean': <Variable path=flax_layer/variable_15, shape=(24,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_16, shape=(24,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_2': DictWrapper({'mean': <Variable path=flax_layer/variable_17, shape=(32,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_18, shape=(32,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_3': DictWrapper({'mean': <Variable path=flax_layer/variable_19, shape=(200,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+E      0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_20, shape=(200,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+E      1. 1. 1. 1. 1. 1. 1. 1.]>})})}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+----------------------------- Captured stdout call -----------------------------
+Model: "FlaxBatchNormModel1"
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
+┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
+│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
+├─────────────────────────────────┼────────────────────────┼───────────────┤
+│ flax_layer (FlaxLayer)          │ (None, 10)             │       354,794 │
+└─────────────────────────────────┴────────────────────────┴───────────────┘
+ Total params: 354,794 (1.35 MB)
+ Trainable params: 354,258 (1.35 MB)
+ Non-trainable params: 536 (2.09 KB)
+___________ TestJaxLayer.test_flax_layer_training_rng_unbound_method ___________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_unbound_method>
+flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxDropoutModel'>
+flax_model_method = None
+init_kwargs = {'method': <function flax_dropout_wrapper at 0x16a760860>}
+trainable_weights = 8, trainable_params = 648226, non_trainable_weights = 0
+non_trainable_params = 0
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent_bound_method",
+            "flax_model_class": "FlaxTrainingIndependentModel",
+            "flax_model_method": "forward",
+            "init_kwargs": {},
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_state_no_method",
+            "flax_model_class": "FlaxBatchNormModel",
+            "flax_model_method": None,
+            "init_kwargs": {},
+            "trainable_weights": 13,
+            "trainable_params": 354258,
+            "non_trainable_weights": 8,
+            "non_trainable_params": 536,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method_dtype_policy",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+                "dtype": DTypePolicy("mixed_float16"),
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+    )
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_flax_layer(
+        self,
+        flax_model_class,
+        flax_model_method,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
+        if "method" in init_kwargs:
+            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
+    
+        def create_wrapper(**kwargs):
+            params = kwargs.pop("params") if "params" in kwargs else None
+            state = kwargs.pop("state") if "state" in kwargs else None
+            if params and state:
+                variables = {**params, **state}
+            elif params:
+                variables = params
+            elif state:
+                variables = state
+            else:
+                variables = None
+            kwargs["variables"] = variables
+            flax_model = flax_model_class()
+            if flax_model_method:
+                kwargs["method"] = getattr(flax_model, flax_model_method)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+    
+    
+>       self._test_layer(
+            flax_model_class.__name__,
+            create_wrapper,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
+
+keras/src/utils/jax_layer_test.py:497: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/jax_layer_test.py:254: in _test_layer
+    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:399: in fit
+    logs = self.train_function(iterator)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:241: in function
+    opt_outputs = multi_step_on_iterator(iterator)
+                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
+    one_step_on_data(iterator.get_next())
+keras/src/backend/tensorflow/trainer.py:125: in wrapper
+    result = step_func(converted_data)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
+    outputs = self.distribute_strategy.run(step_function, args=(data,))
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
+    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
+    return self._call_for_each_replica(fn, args, kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:59: in train_step
+    y_pred = self(x, training=True)
+             ^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:183: in call
+    outputs = self._run_through_graph(
+keras/src/ops/function.py:206: in _run_through_graph
+    outputs = op(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:644: in call
+    return operation(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:612: in call
+    return call_with_fn(self.jax2tf_training_true_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x36e4ebb00>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+----------------------------- Captured stdout call -----------------------------
+Model: "FlaxDropoutModel1"
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
+┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
+│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
+├─────────────────────────────────┼────────────────────────┼───────────────┤
+│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
+└─────────────────────────────────┴────────────────────────┴───────────────┘
+ Total params: 648,226 (2.47 MB)
+ Trainable params: 648,226 (2.47 MB)
+ Non-trainable params: 0 (0.00 B)
+____ TestJaxLayer.test_flax_layer_training_rng_unbound_method_dtype_policy _____
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_unbound_method_dtype_policy>
+flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxDropoutModel'>
+flax_model_method = None
+init_kwargs = {'dtype': <DTypePolicy "mixed_float16">, 'method': <function flax_dropout_wrapper at 0x16a760860>}
+trainable_weights = 8, trainable_params = 648226, non_trainable_weights = 0
+non_trainable_params = 0
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent_bound_method",
+            "flax_model_class": "FlaxTrainingIndependentModel",
+            "flax_model_method": "forward",
+            "init_kwargs": {},
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_state_no_method",
+            "flax_model_class": "FlaxBatchNormModel",
+            "flax_model_method": None,
+            "init_kwargs": {},
+            "trainable_weights": 13,
+            "trainable_params": 354258,
+            "non_trainable_weights": 8,
+            "non_trainable_params": 536,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method_dtype_policy",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+                "dtype": DTypePolicy("mixed_float16"),
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+    )
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_flax_layer(
+        self,
+        flax_model_class,
+        flax_model_method,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
+        if "method" in init_kwargs:
+            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
+    
+        def create_wrapper(**kwargs):
+            params = kwargs.pop("params") if "params" in kwargs else None
+            state = kwargs.pop("state") if "state" in kwargs else None
+            if params and state:
+                variables = {**params, **state}
+            elif params:
+                variables = params
+            elif state:
+                variables = state
+            else:
+                variables = None
+            kwargs["variables"] = variables
+            flax_model = flax_model_class()
+            if flax_model_method:
+                kwargs["method"] = getattr(flax_model, flax_model_method)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+    
+    
+>       self._test_layer(
+            flax_model_class.__name__,
+            create_wrapper,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
+
+keras/src/utils/jax_layer_test.py:497: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/jax_layer_test.py:254: in _test_layer
+    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:399: in fit
+    logs = self.train_function(iterator)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:241: in function
+    opt_outputs = multi_step_on_iterator(iterator)
+                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
+    one_step_on_data(iterator.get_next())
+keras/src/backend/tensorflow/trainer.py:125: in wrapper
+    result = step_func(converted_data)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
+    outputs = self.distribute_strategy.run(step_function, args=(data,))
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
+    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
+    return self._call_for_each_replica(fn, args, kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:59: in train_step
+    y_pred = self(x, training=True)
+             ^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:183: in call
+    outputs = self._run_through_graph(
+keras/src/ops/function.py:206: in _run_through_graph
+    outputs = op(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:644: in call
+    return operation(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:939: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:612: in call
+    return call_with_fn(self.jax2tf_training_true_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x36e43ad40>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+----------------------------- Captured stdout call -----------------------------
+Model: "FlaxDropoutModel1"
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
+┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
+│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
+├─────────────────────────────────┼────────────────────────┼───────────────┤
+│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
+└─────────────────────────────────┴────────────────────────┴───────────────┘
+ Total params: 648,226 (2.47 MB)
+ Trainable params: 648,226 (2.47 MB)
+ Non-trainable params: 0 (0.00 B)
+__ TestJaxLayer.test_state_mismatch_during_update_mapping_instead_of_sequence __
+ValueError: Expected dict, got DictWrapper({'state': DictWrapper({'foo': <Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>})}).
+
+During handling of the above exception, another exception occurred:
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_mapping_instead_of_sequence>
+init_state = {'state': {'foo': 0.0}}, error_regex = 'Structure mismatch'
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "sequence_instead_of_mapping",
+            "init_state": [0.0],
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "mapping_instead_of_sequence",
+            "init_state": {"state": {"foo": 0.0}},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "sequence_instead_of_variable",
+            "init_state": {"state": [[0.0]]},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "no_initial_state",
+            "init_state": None,
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "missing_dict_key",
+            "init_state": {"state": {}},
+            "error_regex": "Structure mismatch ",
+        },
+        {
+            "testcase_name": "missing_variable_in_list",
+            "init_state": {"state": {"foo": [2.0]}},
+            "error_regex": "Structure mismatch",
+        },
+    )
+    def test_state_mismatch_during_update(self, init_state, error_regex):
+        def jax_fn(params, state, inputs):
+            return inputs, {"state": [jnp.ones([])]}
+    
+        layer = JaxLayer(jax_fn, params={}, state=init_state)
+>       with self.assertRaisesRegex(ValueError, error_regex):
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+E       AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': <Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>})})."
+
+keras/src/utils/jax_layer_test.py:712: AssertionError
+_______ TestJaxLayer.test_state_mismatch_during_update_missing_dict_key ________
+ValueError: Expected dict, got DictWrapper({'state': DictWrapper({})}).
+
+During handling of the above exception, another exception occurred:
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_missing_dict_key>
+init_state = {'state': {}}, error_regex = 'Structure mismatch '
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "sequence_instead_of_mapping",
+            "init_state": [0.0],
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "mapping_instead_of_sequence",
+            "init_state": {"state": {"foo": 0.0}},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "sequence_instead_of_variable",
+            "init_state": {"state": [[0.0]]},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "no_initial_state",
+            "init_state": None,
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "missing_dict_key",
+            "init_state": {"state": {}},
+            "error_regex": "Structure mismatch ",
+        },
+        {
+            "testcase_name": "missing_variable_in_list",
+            "init_state": {"state": {"foo": [2.0]}},
+            "error_regex": "Structure mismatch",
+        },
+    )
+    def test_state_mismatch_during_update(self, init_state, error_regex):
+        def jax_fn(params, state, inputs):
+            return inputs, {"state": [jnp.ones([])]}
+    
+        layer = JaxLayer(jax_fn, params={}, state=init_state)
+>       with self.assertRaisesRegex(ValueError, error_regex):
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+E       AssertionError: "Structure mismatch " does not match "Expected dict, got DictWrapper({'state': DictWrapper({})})."
+
+keras/src/utils/jax_layer_test.py:712: AssertionError
+___ TestJaxLayer.test_state_mismatch_during_update_missing_variable_in_list ____
+ValueError: Expected dict, got DictWrapper({'state': DictWrapper({'foo': ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=2.0>])})}).
+
+During handling of the above exception, another exception occurred:
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_missing_variable_in_list>
+init_state = {'state': {'foo': [2.0]}}, error_regex = 'Structure mismatch'
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "sequence_instead_of_mapping",
+            "init_state": [0.0],
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "mapping_instead_of_sequence",
+            "init_state": {"state": {"foo": 0.0}},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "sequence_instead_of_variable",
+            "init_state": {"state": [[0.0]]},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "no_initial_state",
+            "init_state": None,
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "missing_dict_key",
+            "init_state": {"state": {}},
+            "error_regex": "Structure mismatch ",
+        },
+        {
+            "testcase_name": "missing_variable_in_list",
+            "init_state": {"state": {"foo": [2.0]}},
+            "error_regex": "Structure mismatch",
+        },
+    )
+    def test_state_mismatch_during_update(self, init_state, error_regex):
+        def jax_fn(params, state, inputs):
+            return inputs, {"state": [jnp.ones([])]}
+    
+        layer = JaxLayer(jax_fn, params={}, state=init_state)
+>       with self.assertRaisesRegex(ValueError, error_regex):
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+E       AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=2.0>])})})."
+
+keras/src/utils/jax_layer_test.py:712: AssertionError
+_______ TestJaxLayer.test_state_mismatch_during_update_no_initial_state ________
+ValueError: Expected dict, got None.
+
+During handling of the above exception, another exception occurred:
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_no_initial_state>
+init_state = None, error_regex = 'Structure mismatch'
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "sequence_instead_of_mapping",
+            "init_state": [0.0],
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "mapping_instead_of_sequence",
+            "init_state": {"state": {"foo": 0.0}},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "sequence_instead_of_variable",
+            "init_state": {"state": [[0.0]]},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "no_initial_state",
+            "init_state": None,
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "missing_dict_key",
+            "init_state": {"state": {}},
+            "error_regex": "Structure mismatch ",
+        },
+        {
+            "testcase_name": "missing_variable_in_list",
+            "init_state": {"state": {"foo": [2.0]}},
+            "error_regex": "Structure mismatch",
+        },
+    )
+    def test_state_mismatch_during_update(self, init_state, error_regex):
+        def jax_fn(params, state, inputs):
+            return inputs, {"state": [jnp.ones([])]}
+    
+        layer = JaxLayer(jax_fn, params={}, state=init_state)
+>       with self.assertRaisesRegex(ValueError, error_regex):
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+E       AssertionError: "Structure mismatch" does not match "Expected dict, got None."
+
+keras/src/utils/jax_layer_test.py:712: AssertionError
+__ TestJaxLayer.test_state_mismatch_during_update_sequence_instead_of_mapping __
+ValueError: Expected dict, got ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>]).
+
+During handling of the above exception, another exception occurred:
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_sequence_instead_of_mapping>
+init_state = [0.0], error_regex = 'Structure mismatch'
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "sequence_instead_of_mapping",
+            "init_state": [0.0],
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "mapping_instead_of_sequence",
+            "init_state": {"state": {"foo": 0.0}},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "sequence_instead_of_variable",
+            "init_state": {"state": [[0.0]]},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "no_initial_state",
+            "init_state": None,
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "missing_dict_key",
+            "init_state": {"state": {}},
+            "error_regex": "Structure mismatch ",
+        },
+        {
+            "testcase_name": "missing_variable_in_list",
+            "init_state": {"state": {"foo": [2.0]}},
+            "error_regex": "Structure mismatch",
+        },
+    )
+    def test_state_mismatch_during_update(self, init_state, error_regex):
+        def jax_fn(params, state, inputs):
+            return inputs, {"state": [jnp.ones([])]}
+    
+        layer = JaxLayer(jax_fn, params={}, state=init_state)
+>       with self.assertRaisesRegex(ValueError, error_regex):
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+E       AssertionError: "Structure mismatch" does not match "Expected dict, got ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])."
+
+keras/src/utils/jax_layer_test.py:712: AssertionError
+_ TestJaxLayer.test_state_mismatch_during_update_sequence_instead_of_variable __
+ValueError: Expected dict, got DictWrapper({'state': ListWrapper([ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])])}).
+
+During handling of the above exception, another exception occurred:
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_sequence_instead_of_variable>
+init_state = {'state': [[0.0]]}, error_regex = 'Structure mismatch'
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "sequence_instead_of_mapping",
+            "init_state": [0.0],
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "mapping_instead_of_sequence",
+            "init_state": {"state": {"foo": 0.0}},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "sequence_instead_of_variable",
+            "init_state": {"state": [[0.0]]},
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "no_initial_state",
+            "init_state": None,
+            "error_regex": "Structure mismatch",
+        },
+        {
+            "testcase_name": "missing_dict_key",
+            "init_state": {"state": {}},
+            "error_regex": "Structure mismatch ",
+        },
+        {
+            "testcase_name": "missing_variable_in_list",
+            "init_state": {"state": {"foo": [2.0]}},
+            "error_regex": "Structure mismatch",
+        },
+    )
+    def test_state_mismatch_during_update(self, init_state, error_regex):
+        def jax_fn(params, state, inputs):
+            return inputs, {"state": [jnp.ones([])]}
+    
+        layer = JaxLayer(jax_fn, params={}, state=init_state)
+>       with self.assertRaisesRegex(ValueError, error_regex):
+             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+E       AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': ListWrapper([ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])])})."
+
+keras/src/utils/jax_layer_test.py:712: AssertionError
+_______________ TestJaxLayer.test_with_different_argument_order ________________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_different_argument_order>
+
+    def test_with_different_argument_order(self):
+        def jax_call_fn(training, inputs, rng, state, params):
+            return inputs, {}
+    
+        def jax_init_fn(training, inputs, rng):
+            return {}, {}
+    
+        layer = JaxLayer(jax_call_fn, jax_init_fn)
+>       layer(np.ones((1,)))
+
+keras/src/utils/jax_layer_test.py:532: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:614: in call
+    return call_with_fn(self.jax2tf_training_false_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x393b49940>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+_________________ TestJaxLayer.test_with_flax_state_no_params __________________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_flax_state_no_params>
+
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_with_flax_state_no_params(self):
+        class MyFlaxLayer(flax.linen.Module):
+            @flax.linen.compact
+            def __call__(self, x):
+                def zeros_init(shape):
+                    return jnp.zeros(shape, jnp.int32)
+    
+                count = self.variable("a", "b", zeros_init, [])
+                count.value = count.value + 1
+                return x
+    
+        layer = FlaxLayer(MyFlaxLayer(), variables={"a": {"b": 0}})
+>       layer(np.ones((1,)))
+
+keras/src/utils/jax_layer_test.py:634: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:609: in call
+    return call_with_fn(self.jax2tf_training_false_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x393b7aa20>
+tree = {'a': {'b': <tf.Tensor: shape=(), dtype=int32, numpy=1>}}, is_leaf = None
+rest = (DictWrapper({'a': DictWrapper({'b': <Variable path=flax_layer/variable, shape=(), dtype=int64, value=0>})}),)
+leaves = [<tf.Tensor: shape=(), dtype=int32, numpy=1>]
+treedef = PyTreeDef({'a': {'b': *}})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({'a': DictWrapper({'b': <Variable path=flax_layer/variable, shape=(), dtype=int64, value=0>})}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+____________ TestJaxLayer.test_with_state_jax_registered_node_class ____________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_state_jax_registered_node_class>
+
+    def test_with_state_jax_registered_node_class(self):
+        @jax.tree_util.register_pytree_node_class
+        class NamedPoint:
+            def __init__(self, x, y, name):
+                self.x = x
+                self.y = y
+                self.name = name
+    
+            def tree_flatten(self):
+                return ((self.x, self.y), self.name)
+    
+            @classmethod
+            def tree_unflatten(cls, aux_data, children):
+                return cls(*children, aux_data)
+    
+        def jax_fn(params, state, inputs):
+            return inputs, state
+    
+        layer = JaxLayer(jax_fn, state=[NamedPoint(1.0, 2.0, "foo")])
+>       layer(np.ones((1,)))
+
+keras/src/utils/jax_layer_test.py:673: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:609: in call
+    return call_with_fn(self.jax2tf_training_false_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x395be4680>
+tree = [<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x396832d50>]
+is_leaf = None
+rest = (ListWrapper([<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x3923390a0>]),)
+leaves = [<tf.Tensor: shape=(), dtype=float32, numpy=1.0>, <tf.Tensor: shape=(), dtype=float32, numpy=2.0>]
+treedef = PyTreeDef([CustomNode(NamedPoint[foo], [*, *])])
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected list, got ListWrapper([<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x3923390a0>]).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+__________ TestJaxLayer.test_with_training_in_call_fn_but_not_init_fn __________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_training_in_call_fn_but_not_init_fn>
+
+    def test_with_training_in_call_fn_but_not_init_fn(self):
+        def jax_call_fn(params, state, rng, inputs, training):
+            return inputs, {}
+    
+        def jax_init_fn(rng, inputs):
+            return {}, {}
+    
+        layer = JaxLayer(jax_call_fn, jax_init_fn)
+>       layer(np.ones((1,)))
+
+keras/src/utils/jax_layer_test.py:522: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:614: in call
+    return call_with_fn(self.jax2tf_training_false_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x395b993a0>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+=========================== short test summary info ============================
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method - ValueError: Expected dict, got DictWrapper({}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_state_no_method - ValueError: Expected dict, got DictWrapper({'batch_stats': DictWrapper({'BatchNorm_0': DictWrapper({'mean': <Variable path=flax_layer/variable_13, shape=(12,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_14, shape=(12,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_1': DictWrapper({'mean': <Variable path=flax_layer/variable_15, shape=(24,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_16, shape=(24,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_2': DictWrapper({'mean': <Variable path=flax_layer/variable_17, shape=(32,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_18, shape=(32,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_3': DictWrapper({'mean': <Variable path=flax_layer/variable_19, shape=(200,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
+ 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_20, shape=(200,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
+ 1. 1. 1. 1. 1. 1. 1. 1.]>})})}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method - ValueError: Expected dict, got DictWrapper({}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method_dtype_policy - ValueError: Expected dict, got DictWrapper({}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_mapping_instead_of_sequence - AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': <Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>})})."
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_dict_key - AssertionError: "Structure mismatch " does not match "Expected dict, got DictWrapper({'state': DictWrapper({})})."
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_variable_in_list - AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=2.0>])})})."
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_no_initial_state - AssertionError: "Structure mismatch" does not match "Expected dict, got None."
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_mapping - AssertionError: "Structure mismatch" does not match "Expected dict, got ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])."
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_variable - AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': ListWrapper([ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])])})."
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_different_argument_order - ValueError: Expected dict, got DictWrapper({}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_flax_state_no_params - ValueError: Expected dict, got DictWrapper({'a': DictWrapper({'b': <Variable path=flax_layer/variable, shape=(), dtype=int64, value=0>})}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_jax_registered_node_class - ValueError: Expected list, got ListWrapper([<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x3923390a0>]).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_training_in_call_fn_but_not_init_fn - ValueError: Expected dict, got DictWrapper({}).
+======================== 14 failed, 14 passed in 8.05s =========================
+============================= test session starts ==============================
+platform darwin -- Python 3.12.10, pytest-8.4.2, pluggy-1.6.0 -- /Users/wenyiguo/keras/venv/bin/python3.12
+cachedir: .pytest_cache
+rootdir: /Users/wenyiguo/keras
+configfile: pyproject.toml
+plugins: cov-7.0.0
+collecting ... collected 2 items
+
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method FAILED [ 50%]
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method FAILED [100%]
+
+=================================== FAILURES ===================================
+________ TestJaxLayer.test_flax_layer_training_independent_bound_method ________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_independent_bound_method>
+flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxTrainingIndependentModel'>
+flax_model_method = 'forward', init_kwargs = {}, trainable_weights = 8
+trainable_params = 648226, non_trainable_weights = 0, non_trainable_params = 0
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent_bound_method",
+            "flax_model_class": "FlaxTrainingIndependentModel",
+            "flax_model_method": "forward",
+            "init_kwargs": {},
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        # {
+        #     "testcase_name": "training_rng_state_no_method",
+        #     "flax_model_class": "FlaxBatchNormModel",
+        #     "flax_model_method": None,
+        #     "init_kwargs": {},
+        #     "trainable_weights": 13,
+        #     "trainable_params": 354258,
+        #     "non_trainable_weights": 8,
+        #     "non_trainable_params": 536,
+        # },
+        # {
+        #     "testcase_name": "training_rng_unbound_method_dtype_policy",
+        #     "flax_model_class": "FlaxDropoutModel",
+        #     "flax_model_method": None,
+        #     "init_kwargs": {
+        #         "method": "flax_dropout_wrapper",
+        #         "dtype": DTypePolicy("mixed_float16"),
+        #     },
+        #     "trainable_weights": 8,
+        #     "trainable_params": 648226,
+        #     "non_trainable_weights": 0,
+        #     "non_trainable_params": 0,
+        # },
+    )
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_flax_layer(
+        self,
+        flax_model_class,
+        flax_model_method,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
+        if "method" in init_kwargs:
+            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
+    
+        def create_wrapper(**kwargs):
+            params = kwargs.pop("params") if "params" in kwargs else None
+            state = kwargs.pop("state") if "state" in kwargs else None
+            if params and state:
+                variables = {**params, **state}
+            elif params:
+                variables = params
+            elif state:
+                variables = state
+            else:
+                variables = None
+            kwargs["variables"] = variables
+            flax_model = flax_model_class()
+            if flax_model_method:
+                kwargs["method"] = getattr(flax_model, flax_model_method)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+    
+    
+>       self._test_layer(
+            flax_model_class.__name__,
+            create_wrapper,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
+
+keras/src/utils/jax_layer_test.py:497: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/jax_layer_test.py:254: in _test_layer
+    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:399: in fit
+    logs = self.train_function(iterator)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:241: in function
+    opt_outputs = multi_step_on_iterator(iterator)
+                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
+    one_step_on_data(iterator.get_next())
+keras/src/backend/tensorflow/trainer.py:125: in wrapper
+    result = step_func(converted_data)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
+    outputs = self.distribute_strategy.run(step_function, args=(data,))
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
+    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
+    return self._call_for_each_replica(fn, args, kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:59: in train_step
+    y_pred = self(x, training=True)
+             ^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:183: in call
+    outputs = self._run_through_graph(
+keras/src/ops/function.py:206: in _run_through_graph
+    outputs = op(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:644: in call
+    return operation(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:609: in call
+    return call_with_fn(self.jax2tf_training_false_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x31d82f740>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+----------------------------- Captured stdout call -----------------------------
+Model: "FlaxTrainingIndependentModel1"
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
+┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
+│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
+├─────────────────────────────────┼────────────────────────┼───────────────┤
+│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
+└─────────────────────────────────┴────────────────────────┴───────────────┘
+ Total params: 648,226 (2.47 MB)
+ Trainable params: 648,226 (2.47 MB)
+ Non-trainable params: 0 (0.00 B)
+----------------------------- Captured stderr call -----------------------------
+WARNING: All log messages before absl::InitializeLog() is called are written to STDERR
+I0000 00:00:1762560267.960370 1451585 service.cc:148] XLA service 0x15533c0f0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
+I0000 00:00:1762560267.960444 1451585 service.cc:156]   StreamExecutor device (0): Host, Default Version
+I0000 00:00:1762560267.986555 1451585 device_compiler.h:188] Compiled cluster using XLA!  This line is logged at most once for the lifetime of the process.
+___________ TestJaxLayer.test_flax_layer_training_rng_unbound_method ___________
+
+self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_unbound_method>
+flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxDropoutModel'>
+flax_model_method = None
+init_kwargs = {'method': <function flax_dropout_wrapper at 0x1549f8900>}
+trainable_weights = 8, trainable_params = 648226, non_trainable_weights = 0
+non_trainable_params = 0
+
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent_bound_method",
+            "flax_model_class": "FlaxTrainingIndependentModel",
+            "flax_model_method": "forward",
+            "init_kwargs": {},
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_rng_unbound_method",
+            "flax_model_class": "FlaxDropoutModel",
+            "flax_model_method": None,
+            "init_kwargs": {
+                "method": "flax_dropout_wrapper",
+            },
+            "trainable_weights": 8,
+            "trainable_params": 648226,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        # {
+        #     "testcase_name": "training_rng_state_no_method",
+        #     "flax_model_class": "FlaxBatchNormModel",
+        #     "flax_model_method": None,
+        #     "init_kwargs": {},
+        #     "trainable_weights": 13,
+        #     "trainable_params": 354258,
+        #     "non_trainable_weights": 8,
+        #     "non_trainable_params": 536,
+        # },
+        # {
+        #     "testcase_name": "training_rng_unbound_method_dtype_policy",
+        #     "flax_model_class": "FlaxDropoutModel",
+        #     "flax_model_method": None,
+        #     "init_kwargs": {
+        #         "method": "flax_dropout_wrapper",
+        #         "dtype": DTypePolicy("mixed_float16"),
+        #     },
+        #     "trainable_weights": 8,
+        #     "trainable_params": 648226,
+        #     "non_trainable_weights": 0,
+        #     "non_trainable_params": 0,
+        # },
+    )
+    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
+    def test_flax_layer(
+        self,
+        flax_model_class,
+        flax_model_method,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
+        if "method" in init_kwargs:
+            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
+    
+        def create_wrapper(**kwargs):
+            params = kwargs.pop("params") if "params" in kwargs else None
+            state = kwargs.pop("state") if "state" in kwargs else None
+            if params and state:
+                variables = {**params, **state}
+            elif params:
+                variables = params
+            elif state:
+                variables = state
+            else:
+                variables = None
+            kwargs["variables"] = variables
+            flax_model = flax_model_class()
+            if flax_model_method:
+                kwargs["method"] = getattr(flax_model, flax_model_method)
+            if backend.backend() == "jax":
+                return FlaxLayer(flax_model_class(), **kwargs)
+            elif backend.backend() == "tensorflow":
+                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
+    
+    
+>       self._test_layer(
+            flax_model_class.__name__,
+            create_wrapper,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
+
+keras/src/utils/jax_layer_test.py:497: 
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+keras/src/utils/jax_layer_test.py:254: in _test_layer
+    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:399: in fit
+    logs = self.train_function(iterator)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:241: in function
+    opt_outputs = multi_step_on_iterator(iterator)
+                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
+    one_step_on_data(iterator.get_next())
+keras/src/backend/tensorflow/trainer.py:125: in wrapper
+    result = step_func(converted_data)
+             ^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
+    outputs = self.distribute_strategy.run(step_function, args=(data,))
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
+    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
+    return self._call_for_each_replica(fn, args, kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
+    return func(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^
+keras/src/backend/tensorflow/trainer.py:59: in train_step
+    y_pred = self(x, training=True)
+             ^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:183: in call
+    outputs = self._run_through_graph(
+keras/src/ops/function.py:206: in _run_through_graph
+    outputs = op(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^
+keras/src/models/functional.py:644: in call
+    return operation(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/layers/layer.py:941: in __call__
+    outputs = super().__call__(*args, **kwargs)
+              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/traceback_utils.py:113: in error_handler
+    return fn(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^
+keras/src/ops/operation.py:77: in __call__
+    return self.call(*args, **kwargs)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:612: in call
+    return call_with_fn(self.jax2tf_training_true_fn)
+           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+keras/src/utils/jax_layer.py:586: in call_with_fn
+    jax.tree_util.tree_map(
+_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
+
+f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x323642de0>
+tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
+treedef = PyTreeDef({})
+
+    @export
+    def tree_map(f: Callable[..., Any],
+                 tree: Any,
+                 *rest: Any,
+                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
+      """Alias of :func:`jax.tree.map`."""
+      leaves, treedef = tree_flatten(tree, is_leaf)
+>     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
+                               ^^^^^^^^^^^^^^^^^^^^^^^^
+E     ValueError: Expected dict, got DictWrapper({}).
+
+venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
+----------------------------- Captured stdout call -----------------------------
+Model: "FlaxDropoutModel1"
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
+┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
+│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
+├─────────────────────────────────┼────────────────────────┼───────────────┤
+│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
+└─────────────────────────────────┴────────────────────────┴───────────────┘
+ Total params: 648,226 (2.47 MB)
+ Trainable params: 648,226 (2.47 MB)
+ Non-trainable params: 0 (0.00 B)
+=========================== short test summary info ============================
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method - ValueError: Expected dict, got DictWrapper({}).
+FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method - ValueError: Expected dict, got DictWrapper({}).
+============================== 2 failed in 1.45s ===============================
diff --git a/output.txt b/output.txt
new file mode 100644
index 000000000000..6960ce8c14cb
--- /dev/null
+++ b/output.txt
@@ -0,0 +1,17 @@
+============================= test session starts ==============================
+platform darwin -- Python 3.12.10, pytest-8.4.2, pluggy-1.6.0 -- /Users/wenyiguo/keras/venv/bin/python3.12
+cachedir: .pytest_cache
+rootdir: /Users/wenyiguo/keras
+configfile: pyproject.toml
+plugins: cov-7.0.0
+collecting ... collected 25 items / 24 deselected / 1 selected
+
+keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_none_leaves 
+self.state: {'foo': None}
+new_state: {'foo': None}
+self.state after:  {'foo': None}
+pytree name _DictWrapper
+pytree name _DictWrapper
+PASSED
+
+======================= 1 passed, 24 deselected in 0.10s =======================

From 4d484d92e78044b5bab28a2e47725ece4ed92039 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 16:51:16 -0800
Subject: [PATCH 04/12] format

---
 keras/src/utils/jax_layer.py | 61 ++++++++++++++----------------------
 1 file changed, 24 insertions(+), 37 deletions(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index c5481115c085..d062a64f0707 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -1,8 +1,19 @@
 import inspect
 
+
+
+
+import collections
+import functools
+import itertools
+import keras
 import numpy as np
+import string
+import tensorflow as tf
 
+from jax.experimental import jax2tf 
 from keras.src import backend
+from keras.src import random
 from keras.src import tree
 from keras.src.api_export import keras_export
 from keras.src.backend.common.variables import is_float_dtype
@@ -12,22 +23,18 @@
 from keras.src.utils import jax_utils
 from keras.src.utils import tracking
 from keras.src.utils.module_utils import jax
-import tensorflow as tf
-from jax.experimental import jax2tf 
-import keras
-import itertools
-import string
-import functools
-from keras.src import random
-import logging
-import collections
+
+
+
 
 
 def standardize_pytree_collections(pytree):
     if isinstance(pytree, collections.abc.Mapping):
-        return {k: standardize_pytree_collections(v) for k, v in pytree.items()}
+        return {k: standardize_pytree_collections(v)
+                for k, v in pytree.items()}
     elif isinstance(pytree, collections.abc.Sequence):
-        return [standardize_pytree_collections(v) for v in pytree]
+        return [standardize_pytree_collections(v)
+                for v in pytree]
     else:
         return pytree
 
@@ -343,7 +350,6 @@ def get_single_jax2tf_shape(shape):
             return "(" + ", ".join(jax2tf_shape) + ")"
 
         res = tree.map_shape_structure(get_single_jax2tf_shape, input_shape)
-        logging.info("_get_jax2tf_input_shape res:", res)
         return res
 
     def _jax2tf_convert(self, fn, polymorphic_shapes):
@@ -475,9 +481,9 @@ def _initialize_weights(self, input_shape):
         if jax_utils.is_in_jax_tracing_scope() or tf.inside_function():
             # This exception is not actually shown, it is caught and a detailed
             # warning about calling 'build' is printed.
-            raise ValueError("'JaxLayer' cannot be built in tracing scope or inside tf function")
+            raise ValueError("'JaxLayer' cannot be built in tracing scope"
+                             "or inside tf function")
 
-        logging.info("_initialize_weights input_shape:", input_shape)
         # Initialize `params` and `state` if needed by calling `init_fn`.
         def create_input(shape):
             shape = [d if d is not None else 1 for d in shape]
@@ -582,29 +588,10 @@ def call_with_fn(fn):
                         assign_state_to_variable, new_state, self.state
                     )
                 elif backend.backend() == "tensorflow":
-                    # self.state = standardize_pytree_collections(self.state)
-                    print("\nself.state:", self.state)
-                    print("new_state:", new_state)
-                    print("self.state after: ", standardize_pytree_collections(self.state))
-                    print("pytree name", type(self.state).__name__)
-                    print("pytree name", type(new_state).__name__)
-                    jax.tree_util.tree_map(assign_state_to_variable, standardize_pytree_collections(new_state), standardize_pytree_collections(self.state))
-                    # jax.tree_util.tree_map(
-                    #     assign_state_to_variable, new_state, self.state
-                    # )
-                    # new_state_leaves = jax.tree_util.tree_leaves(new_state)
-                    # state_leaves = jax.tree_util.tree_leaves(self.state)
-                    # if len(new_state_leaves) != len(state_leaves):
-                    #     # This indicates a more fundamental structure divergence.
-                    #     raise ValueError(
-                    #         "State leaf count mismatch between jax2tf output and layer state: "
-                    #         f"{len(new_state_leaves)} vs {len(state_leaves)}. "
-                    #         f"new_state structure: {jax.tree_util.tree_structure(new_state)}, "
-                    #         f"self.state structure: {jax.tree_util.tree_structure(self.state)}"
-                    #     )
-                    # for new_val, state_leaf in zip(new_state_leaves, state_leaves):
-                    #     assign_state_to_variable(new_val, state_leaf)
-                    
+                    jax.tree_util.tree_map(
+                        assign_state_to_variable,
+                        standardize_pytree_collections(new_state),
+                        standardize_pytree_collections(self.state))
                 return predictions
             else:
                 return fn(*call_args)

From 1dfe1d3aa75d74b93377aa2fb18e3385ae94a326 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 16:55:36 -0800
Subject: [PATCH 05/12] fix test

---
 keras/src/utils/jax_layer_test.py | 111 +++++++++++++++---------------
 1 file changed, 55 insertions(+), 56 deletions(-)

diff --git a/keras/src/utils/jax_layer_test.py b/keras/src/utils/jax_layer_test.py
index 157ae233eef4..83774adcd00d 100644
--- a/keras/src/utils/jax_layer_test.py
+++ b/keras/src/utils/jax_layer_test.py
@@ -238,11 +238,12 @@ def verify_weights_and_params(layer):
         )
         model1.summary()
 
+        verify_weights_and_params(layer1)
+
         model1.compile(
             loss="categorical_crossentropy",
             optimizer="adam",
             metrics=[metrics.CategoricalAccuracy()],
-            run_eagerly=True,
         )
 
         tw1_before_fit = tree.map_structure(
@@ -259,8 +260,6 @@ def verify_weights_and_params(layer):
             backend.convert_to_numpy, layer1.non_trainable_weights
         )
 
-        verify_weights_and_params(layer1)
-
         # verify both trainable and non-trainable weights did change after fit
         for before, after in zip(tw1_before_fit, tw1_after_fit):
             self.assertNotAllClose(before, after)
@@ -357,59 +356,59 @@ def call(self, inputs):
         output5 = model5(x_test)
         self.assertNotAllClose(output5, 0.0)
 
-    # @parameterized.named_parameters(
-        # {
-        #     "testcase_name": "training_independent",
-        #     "init_kwargs": {
-        #         "call_fn": jax_stateless_apply,
-        #         "init_fn": jax_stateless_init,
-        #     },
-        #     "trainable_weights": 6,
-        #     "trainable_params": 266610,
-        #     "non_trainable_weights": 0,
-        #     "non_trainable_params": 0,
-        # },
-        # {
-        #     "testcase_name": "training_state",
-        #     "init_kwargs": {
-        #         "call_fn": jax_stateful_apply,
-        #         "init_fn": jax_stateful_init,
-        #     },
-        #     "trainable_weights": 6,
-        #     "trainable_params": 266610,
-        #     "non_trainable_weights": 1,
-        #     "non_trainable_params": 1,
-        # },
-        # {
-        #     "testcase_name": "training_state_dtype_policy",
-        #     "init_kwargs": {
-        #         "call_fn": jax_stateful_apply,
-        #         "init_fn": jax_stateful_init,
-        #         "dtype": DTypePolicy("mixed_float16"),
-        #     },
-        #     "trainable_weights": 6,
-        #     "trainable_params": 266610,
-        #     "non_trainable_weights": 1,
-        #     "non_trainable_params": 1,
-        # },
-    # )
-    # def test_jax_layer(
-    #     self,
-    #     init_kwargs,
-    #     trainable_weights,
-    #     trainable_params,
-    #     non_trainable_weights,
-    #     non_trainable_params,
-    # ):
-    #     self._test_layer(
-    #         init_kwargs["call_fn"].__name__,
-    #         JaxLayer,
-    #         init_kwargs,
-    #         trainable_weights,
-    #         trainable_params,
-    #         non_trainable_weights,
-    #         non_trainable_params,
-    #     )
+    @parameterized.named_parameters(
+        {
+            "testcase_name": "training_independent",
+            "init_kwargs": {
+                "call_fn": jax_stateless_apply,
+                "init_fn": jax_stateless_init,
+            },
+            "trainable_weights": 6,
+            "trainable_params": 266610,
+            "non_trainable_weights": 0,
+            "non_trainable_params": 0,
+        },
+        {
+            "testcase_name": "training_state",
+            "init_kwargs": {
+                "call_fn": jax_stateful_apply,
+                "init_fn": jax_stateful_init,
+            },
+            "trainable_weights": 6,
+            "trainable_params": 266610,
+            "non_trainable_weights": 1,
+            "non_trainable_params": 1,
+        },
+        {
+            "testcase_name": "training_state_dtype_policy",
+            "init_kwargs": {
+                "call_fn": jax_stateful_apply,
+                "init_fn": jax_stateful_init,
+                "dtype": DTypePolicy("mixed_float16"),
+            },
+            "trainable_weights": 6,
+            "trainable_params": 266610,
+            "non_trainable_weights": 1,
+            "non_trainable_params": 1,
+        },
+    )
+    def test_jax_layer(
+        self,
+        init_kwargs,
+        trainable_weights,
+        trainable_params,
+        non_trainable_weights,
+        non_trainable_params,
+    ):
+        self._test_layer(
+            init_kwargs["call_fn"].__name__,
+            JaxLayer,
+            init_kwargs,
+            trainable_weights,
+            trainable_params,
+            non_trainable_weights,
+            non_trainable_params,
+        )
 
     @parameterized.named_parameters(
         {

From ce13e690adfd3dc4299b7c0cc37d4d031a325424 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 17:04:39 -0800
Subject: [PATCH 06/12] format

---
 keras/src/utils/jax_layer.py | 13 +++++--------
 1 file changed, 5 insertions(+), 8 deletions(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index d062a64f0707..beab12a361e8 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -1,17 +1,14 @@
 import inspect
 
-
-
-
 import collections
 import functools
 import itertools
-import keras
 import numpy as np
 import string
-import tensorflow as tf
 
+import jax
 from jax.experimental import jax2tf 
+import keras
 from keras.src import backend
 from keras.src import random
 from keras.src import tree
@@ -23,7 +20,7 @@
 from keras.src.utils import jax_utils
 from keras.src.utils import tracking
 from keras.src.utils.module_utils import jax
-
+import tensorflow as tf
 
 
 
@@ -249,8 +246,8 @@ def __init__(
     ):
         if backend.backend() not in ["jax", "tensorflow"]:
             raise ValueError(
-                "JaxLayer is only supported with the JAX or Tensorflow backend. Current "
-                f"backend: {backend.backend()}"
+                "JaxLayer is only supported with the JAX or Tensorflow backend. "
+                f"Current backend: {backend.backend()}"
             )
 
         if init_fn is None and params is None and state is None:

From fa00d7ad2f0e991ce4448d631b36ac59f40a4f88 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 17:10:01 -0800
Subject: [PATCH 07/12] format

---
 keras/src/utils/jax_layer.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index beab12a361e8..cbd52567f6dd 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -246,8 +246,8 @@ def __init__(
     ):
         if backend.backend() not in ["jax", "tensorflow"]:
             raise ValueError(
-                "JaxLayer is only supported with the JAX or Tensorflow backend. "
-                f"Current backend: {backend.backend()}"
+                "JaxLayer is only supported with the JAX or Tensorflow backend"
+                f". Current backend: {backend.backend()}"
             )
 
         if init_fn is None and params is None and state is None:

From 57beea1aeabeb3e92acc11eb9b8de97355319bec Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 17:35:47 -0800
Subject: [PATCH 08/12] import fix

---
 keras/src/utils/jax_layer.py | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index cbd52567f6dd..62d91d4cf948 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -6,9 +6,7 @@
 import numpy as np
 import string
 
-import jax
 from jax.experimental import jax2tf 
-import keras
 from keras.src import backend
 from keras.src import random
 from keras.src import tree
@@ -19,8 +17,9 @@
 from keras.src.saving import serialization_lib
 from keras.src.utils import jax_utils
 from keras.src.utils import tracking
+from keras.src import ops
 from keras.src.utils.module_utils import jax
-import tensorflow as tf
+from keras.src.utils.module_utils import tensorflow as tf
 
 
 
@@ -484,7 +483,7 @@ def _initialize_weights(self, input_shape):
         # Initialize `params` and `state` if needed by calling `init_fn`.
         def create_input(shape):
             shape = [d if d is not None else 1 for d in shape]
-            return keras.ops.ones(shape)
+            return ops.ones(shape)
         
         init_inputs = tree.map_shape_structure(create_input, input_shape)
         init_args = []

From 9e6afa923fda6ab2a3240e433021b94f84a14c4c Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Fri, 7 Nov 2025 17:47:02 -0800
Subject: [PATCH 09/12] fix import

---
 keras/src/utils/jax_layer.py         |    2 +-
 keras/src/utils/keras.code-workspace |    7 -
 log.log                              | 1911 --------------------------
 output.txt                           |   17 -
 4 files changed, 1 insertion(+), 1936 deletions(-)
 delete mode 100644 keras/src/utils/keras.code-workspace
 delete mode 100644 log.log
 delete mode 100644 output.txt

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index 62d91d4cf948..7a9cb9524556 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -6,7 +6,6 @@
 import numpy as np
 import string
 
-from jax.experimental import jax2tf 
 from keras.src import backend
 from keras.src import random
 from keras.src import tree
@@ -19,6 +18,7 @@
 from keras.src.utils import tracking
 from keras.src import ops
 from keras.src.utils.module_utils import jax
+from jax.experimental import jax2tf 
 from keras.src.utils.module_utils import tensorflow as tf
 
 
diff --git a/keras/src/utils/keras.code-workspace b/keras/src/utils/keras.code-workspace
deleted file mode 100644
index 084403744299..000000000000
--- a/keras/src/utils/keras.code-workspace
+++ /dev/null
@@ -1,7 +0,0 @@
-{
-    "folders": [
-        {
-            "path": "../.."
-        }
-    ]
-}
\ No newline at end of file
diff --git a/log.log b/log.log
deleted file mode 100644
index 4012ad0c1e91..000000000000
--- a/log.log
+++ /dev/null
@@ -1,1911 +0,0 @@
-============================= test session starts ==============================
-platform darwin -- Python 3.12.10, pytest-8.4.2, pluggy-1.6.0 -- /Users/wenyiguo/keras/venv/bin/python3.12
-cachedir: .pytest_cache
-rootdir: /Users/wenyiguo/keras
-configfile: pyproject.toml
-plugins: cov-7.0.0
-collecting ... collected 28 items
-
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method FAILED [  3%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_state_no_method FAILED [  7%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method FAILED [ 10%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method_dtype_policy FAILED [ 14%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_jax_layer_training_independent PASSED [ 17%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_jax_layer_training_state PASSED [ 21%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_jax_layer_training_state_dtype_policy PASSED [ 25%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_rng_seeding PASSED [ 28%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_mapping_instead_of_sequence FAILED [ 32%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_dict_key FAILED [ 35%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_variable_in_list FAILED [ 39%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_no_initial_state FAILED [ 42%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_mapping FAILED [ 46%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_variable FAILED [ 50%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_different_argument_order FAILED [ 53%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_flax_state_no_params FAILED [ 57%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_minimal_arguments PASSED [ 60%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_missing_inputs_in_call_fn PASSED [ 64%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_missing_inputs_in_init_fn PASSED [ 67%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_no_init_fn_and_no_params PASSED [ 71%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_polymorphic_shape_more_than_26_dimension_names PASSED [ 75%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_jax_registered_node_class FAILED [ 78%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_non_tensor_leaves PASSED [ 82%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_none_leaves PASSED [ 85%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_structures_as_inputs_and_outputs PASSED [ 89%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_training_in_call_fn_but_not_init_fn FAILED [ 92%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_unsupported_argument_in_call_fn PASSED [ 96%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_unsupported_argument_in_init_fn PASSED [100%]
-
-=================================== FAILURES ===================================
-________ TestJaxLayer.test_flax_layer_training_independent_bound_method ________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_independent_bound_method>
-flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxTrainingIndependentModel'>
-flax_model_method = 'forward', init_kwargs = {}, trainable_weights = 8
-trainable_params = 648226, non_trainable_weights = 0, non_trainable_params = 0
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent_bound_method",
-            "flax_model_class": "FlaxTrainingIndependentModel",
-            "flax_model_method": "forward",
-            "init_kwargs": {},
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_state_no_method",
-            "flax_model_class": "FlaxBatchNormModel",
-            "flax_model_method": None,
-            "init_kwargs": {},
-            "trainable_weights": 13,
-            "trainable_params": 354258,
-            "non_trainable_weights": 8,
-            "non_trainable_params": 536,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method_dtype_policy",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-                "dtype": DTypePolicy("mixed_float16"),
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-    )
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_flax_layer(
-        self,
-        flax_model_class,
-        flax_model_method,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
-        if "method" in init_kwargs:
-            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
-    
-        def create_wrapper(**kwargs):
-            params = kwargs.pop("params") if "params" in kwargs else None
-            state = kwargs.pop("state") if "state" in kwargs else None
-            if params and state:
-                variables = {**params, **state}
-            elif params:
-                variables = params
-            elif state:
-                variables = state
-            else:
-                variables = None
-            kwargs["variables"] = variables
-            flax_model = flax_model_class()
-            if flax_model_method:
-                kwargs["method"] = getattr(flax_model, flax_model_method)
-            if backend.backend() == "jax":
-                return FlaxLayer(flax_model_class(), **kwargs)
-            elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-    
-    
->       self._test_layer(
-            flax_model_class.__name__,
-            create_wrapper,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
-
-keras/src/utils/jax_layer_test.py:497: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/jax_layer_test.py:254: in _test_layer
-    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:399: in fit
-    logs = self.train_function(iterator)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:241: in function
-    opt_outputs = multi_step_on_iterator(iterator)
-                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
-    one_step_on_data(iterator.get_next())
-keras/src/backend/tensorflow/trainer.py:125: in wrapper
-    result = step_func(converted_data)
-             ^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
-    outputs = self.distribute_strategy.run(step_function, args=(data,))
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
-    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
-    return self._call_for_each_replica(fn, args, kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:59: in train_step
-    y_pred = self(x, training=True)
-             ^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:183: in call
-    outputs = self._run_through_graph(
-keras/src/ops/function.py:206: in _run_through_graph
-    outputs = op(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:644: in call
-    return operation(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:609: in call
-    return call_with_fn(self.jax2tf_training_false_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x34ec467a0>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
------------------------------ Captured stdout call -----------------------------
-Model: "FlaxTrainingIndependentModel1"
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
-┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
-│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
-├─────────────────────────────────┼────────────────────────┼───────────────┤
-│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
-└─────────────────────────────────┴────────────────────────┴───────────────┘
- Total params: 648,226 (2.47 MB)
- Trainable params: 648,226 (2.47 MB)
- Non-trainable params: 0 (0.00 B)
------------------------------ Captured stderr call -----------------------------
-WARNING: All log messages before absl::InitializeLog() is called are written to STDERR
-I0000 00:00:1762560145.098912 1448076 service.cc:148] XLA service 0x11f0dbaf0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
-I0000 00:00:1762560145.098989 1448076 service.cc:156]   StreamExecutor device (0): Host, Default Version
-I0000 00:00:1762560145.119877 1448076 device_compiler.h:188] Compiled cluster using XLA!  This line is logged at most once for the lifetime of the process.
-__________ TestJaxLayer.test_flax_layer_training_rng_state_no_method ___________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_state_no_method>
-flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxBatchNormModel'>
-flax_model_method = None, init_kwargs = {}, trainable_weights = 13
-trainable_params = 354258, non_trainable_weights = 8, non_trainable_params = 536
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent_bound_method",
-            "flax_model_class": "FlaxTrainingIndependentModel",
-            "flax_model_method": "forward",
-            "init_kwargs": {},
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_state_no_method",
-            "flax_model_class": "FlaxBatchNormModel",
-            "flax_model_method": None,
-            "init_kwargs": {},
-            "trainable_weights": 13,
-            "trainable_params": 354258,
-            "non_trainable_weights": 8,
-            "non_trainable_params": 536,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method_dtype_policy",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-                "dtype": DTypePolicy("mixed_float16"),
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-    )
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_flax_layer(
-        self,
-        flax_model_class,
-        flax_model_method,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
-        if "method" in init_kwargs:
-            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
-    
-        def create_wrapper(**kwargs):
-            params = kwargs.pop("params") if "params" in kwargs else None
-            state = kwargs.pop("state") if "state" in kwargs else None
-            if params and state:
-                variables = {**params, **state}
-            elif params:
-                variables = params
-            elif state:
-                variables = state
-            else:
-                variables = None
-            kwargs["variables"] = variables
-            flax_model = flax_model_class()
-            if flax_model_method:
-                kwargs["method"] = getattr(flax_model, flax_model_method)
-            if backend.backend() == "jax":
-                return FlaxLayer(flax_model_class(), **kwargs)
-            elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-    
-    
->       self._test_layer(
-            flax_model_class.__name__,
-            create_wrapper,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
-
-keras/src/utils/jax_layer_test.py:497: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/jax_layer_test.py:254: in _test_layer
-    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:399: in fit
-    logs = self.train_function(iterator)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:241: in function
-    opt_outputs = multi_step_on_iterator(iterator)
-                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
-    one_step_on_data(iterator.get_next())
-keras/src/backend/tensorflow/trainer.py:125: in wrapper
-    result = step_func(converted_data)
-             ^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
-    outputs = self.distribute_strategy.run(step_function, args=(data,))
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
-    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
-    return self._call_for_each_replica(fn, args, kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:59: in train_step
-    y_pred = self(x, training=True)
-             ^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:183: in call
-    outputs = self._run_through_graph(
-keras/src/ops/function.py:206: in _run_through_graph
-    outputs = op(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:644: in call
-    return operation(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:612: in call
-    return call_with_fn(self.jax2tf_training_true_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x36cc81580>
-tree = {'batch_stats': {'BatchNorm_0': {'mean': <tf.Tensor: shape=(12,), dtype=float32, numpy=
-array([-0.00319871, -0.0067011... , 0.997175  , 1.0033267 ,
-       0.99977   , 0.99732304, 1.0004325 , 0.99955   , 0.99559575],
-      dtype=float32)>}}}
-is_leaf = None
-rest = (DictWrapper({'batch_stats': DictWrapper({'BatchNorm_0': DictWrapper({'mean': <Variable path=flax_layer/variable_13, s...1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1.]>})})}),)
-leaves = [<tf.Tensor: shape=(12,), dtype=float32, numpy=
-array([-0.00319871, -0.00670112, -0.0096636 , -0.00773753, -0.0039517 ...      0.9931413 , 0.9929665 , 0.99336755, 0.9929529 , 0.992772  ,
-       0.9927061 , 0.9929846 ], dtype=float32)>, ...]
-treedef = PyTreeDef({'batch_stats': {'BatchNorm_0': {'mean': *, 'var': *}, 'BatchNorm_1': {'mean': *, 'var': *}, 'BatchNorm_2': {'mean': *, 'var': *}, 'BatchNorm_3': {'mean': *, 'var': *}}})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({'batch_stats': DictWrapper({'BatchNorm_0': DictWrapper({'mean': <Variable path=flax_layer/variable_13, shape=(12,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_14, shape=(12,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_1': DictWrapper({'mean': <Variable path=flax_layer/variable_15, shape=(24,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_16, shape=(24,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_2': DictWrapper({'mean': <Variable path=flax_layer/variable_17, shape=(32,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_18, shape=(32,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_3': DictWrapper({'mean': <Variable path=flax_layer/variable_19, shape=(200,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
-E      0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_20, shape=(200,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
-E      1. 1. 1. 1. 1. 1. 1. 1.]>})})}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
------------------------------ Captured stdout call -----------------------------
-Model: "FlaxBatchNormModel1"
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
-┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
-│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
-├─────────────────────────────────┼────────────────────────┼───────────────┤
-│ flax_layer (FlaxLayer)          │ (None, 10)             │       354,794 │
-└─────────────────────────────────┴────────────────────────┴───────────────┘
- Total params: 354,794 (1.35 MB)
- Trainable params: 354,258 (1.35 MB)
- Non-trainable params: 536 (2.09 KB)
-___________ TestJaxLayer.test_flax_layer_training_rng_unbound_method ___________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_unbound_method>
-flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxDropoutModel'>
-flax_model_method = None
-init_kwargs = {'method': <function flax_dropout_wrapper at 0x16a760860>}
-trainable_weights = 8, trainable_params = 648226, non_trainable_weights = 0
-non_trainable_params = 0
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent_bound_method",
-            "flax_model_class": "FlaxTrainingIndependentModel",
-            "flax_model_method": "forward",
-            "init_kwargs": {},
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_state_no_method",
-            "flax_model_class": "FlaxBatchNormModel",
-            "flax_model_method": None,
-            "init_kwargs": {},
-            "trainable_weights": 13,
-            "trainable_params": 354258,
-            "non_trainable_weights": 8,
-            "non_trainable_params": 536,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method_dtype_policy",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-                "dtype": DTypePolicy("mixed_float16"),
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-    )
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_flax_layer(
-        self,
-        flax_model_class,
-        flax_model_method,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
-        if "method" in init_kwargs:
-            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
-    
-        def create_wrapper(**kwargs):
-            params = kwargs.pop("params") if "params" in kwargs else None
-            state = kwargs.pop("state") if "state" in kwargs else None
-            if params and state:
-                variables = {**params, **state}
-            elif params:
-                variables = params
-            elif state:
-                variables = state
-            else:
-                variables = None
-            kwargs["variables"] = variables
-            flax_model = flax_model_class()
-            if flax_model_method:
-                kwargs["method"] = getattr(flax_model, flax_model_method)
-            if backend.backend() == "jax":
-                return FlaxLayer(flax_model_class(), **kwargs)
-            elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-    
-    
->       self._test_layer(
-            flax_model_class.__name__,
-            create_wrapper,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
-
-keras/src/utils/jax_layer_test.py:497: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/jax_layer_test.py:254: in _test_layer
-    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:399: in fit
-    logs = self.train_function(iterator)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:241: in function
-    opt_outputs = multi_step_on_iterator(iterator)
-                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
-    one_step_on_data(iterator.get_next())
-keras/src/backend/tensorflow/trainer.py:125: in wrapper
-    result = step_func(converted_data)
-             ^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
-    outputs = self.distribute_strategy.run(step_function, args=(data,))
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
-    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
-    return self._call_for_each_replica(fn, args, kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:59: in train_step
-    y_pred = self(x, training=True)
-             ^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:183: in call
-    outputs = self._run_through_graph(
-keras/src/ops/function.py:206: in _run_through_graph
-    outputs = op(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:644: in call
-    return operation(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:612: in call
-    return call_with_fn(self.jax2tf_training_true_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x36e4ebb00>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
------------------------------ Captured stdout call -----------------------------
-Model: "FlaxDropoutModel1"
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
-┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
-│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
-├─────────────────────────────────┼────────────────────────┼───────────────┤
-│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
-└─────────────────────────────────┴────────────────────────┴───────────────┘
- Total params: 648,226 (2.47 MB)
- Trainable params: 648,226 (2.47 MB)
- Non-trainable params: 0 (0.00 B)
-____ TestJaxLayer.test_flax_layer_training_rng_unbound_method_dtype_policy _____
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_unbound_method_dtype_policy>
-flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxDropoutModel'>
-flax_model_method = None
-init_kwargs = {'dtype': <DTypePolicy "mixed_float16">, 'method': <function flax_dropout_wrapper at 0x16a760860>}
-trainable_weights = 8, trainable_params = 648226, non_trainable_weights = 0
-non_trainable_params = 0
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent_bound_method",
-            "flax_model_class": "FlaxTrainingIndependentModel",
-            "flax_model_method": "forward",
-            "init_kwargs": {},
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_state_no_method",
-            "flax_model_class": "FlaxBatchNormModel",
-            "flax_model_method": None,
-            "init_kwargs": {},
-            "trainable_weights": 13,
-            "trainable_params": 354258,
-            "non_trainable_weights": 8,
-            "non_trainable_params": 536,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method_dtype_policy",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-                "dtype": DTypePolicy("mixed_float16"),
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-    )
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_flax_layer(
-        self,
-        flax_model_class,
-        flax_model_method,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
-        if "method" in init_kwargs:
-            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
-    
-        def create_wrapper(**kwargs):
-            params = kwargs.pop("params") if "params" in kwargs else None
-            state = kwargs.pop("state") if "state" in kwargs else None
-            if params and state:
-                variables = {**params, **state}
-            elif params:
-                variables = params
-            elif state:
-                variables = state
-            else:
-                variables = None
-            kwargs["variables"] = variables
-            flax_model = flax_model_class()
-            if flax_model_method:
-                kwargs["method"] = getattr(flax_model, flax_model_method)
-            if backend.backend() == "jax":
-                return FlaxLayer(flax_model_class(), **kwargs)
-            elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-    
-    
->       self._test_layer(
-            flax_model_class.__name__,
-            create_wrapper,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
-
-keras/src/utils/jax_layer_test.py:497: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/jax_layer_test.py:254: in _test_layer
-    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:399: in fit
-    logs = self.train_function(iterator)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:241: in function
-    opt_outputs = multi_step_on_iterator(iterator)
-                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
-    one_step_on_data(iterator.get_next())
-keras/src/backend/tensorflow/trainer.py:125: in wrapper
-    result = step_func(converted_data)
-             ^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
-    outputs = self.distribute_strategy.run(step_function, args=(data,))
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
-    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
-    return self._call_for_each_replica(fn, args, kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:59: in train_step
-    y_pred = self(x, training=True)
-             ^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:183: in call
-    outputs = self._run_through_graph(
-keras/src/ops/function.py:206: in _run_through_graph
-    outputs = op(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:644: in call
-    return operation(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:939: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:612: in call
-    return call_with_fn(self.jax2tf_training_true_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x36e43ad40>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
------------------------------ Captured stdout call -----------------------------
-Model: "FlaxDropoutModel1"
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
-┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
-│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
-├─────────────────────────────────┼────────────────────────┼───────────────┤
-│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
-└─────────────────────────────────┴────────────────────────┴───────────────┘
- Total params: 648,226 (2.47 MB)
- Trainable params: 648,226 (2.47 MB)
- Non-trainable params: 0 (0.00 B)
-__ TestJaxLayer.test_state_mismatch_during_update_mapping_instead_of_sequence __
-ValueError: Expected dict, got DictWrapper({'state': DictWrapper({'foo': <Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>})}).
-
-During handling of the above exception, another exception occurred:
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_mapping_instead_of_sequence>
-init_state = {'state': {'foo': 0.0}}, error_regex = 'Structure mismatch'
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "sequence_instead_of_mapping",
-            "init_state": [0.0],
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "mapping_instead_of_sequence",
-            "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "sequence_instead_of_variable",
-            "init_state": {"state": [[0.0]]},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "no_initial_state",
-            "init_state": None,
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "missing_dict_key",
-            "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
-        },
-        {
-            "testcase_name": "missing_variable_in_list",
-            "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
-        },
-    )
-    def test_state_mismatch_during_update(self, init_state, error_regex):
-        def jax_fn(params, state, inputs):
-            return inputs, {"state": [jnp.ones([])]}
-    
-        layer = JaxLayer(jax_fn, params={}, state=init_state)
->       with self.assertRaisesRegex(ValueError, error_regex):
-             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-E       AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': <Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>})})."
-
-keras/src/utils/jax_layer_test.py:712: AssertionError
-_______ TestJaxLayer.test_state_mismatch_during_update_missing_dict_key ________
-ValueError: Expected dict, got DictWrapper({'state': DictWrapper({})}).
-
-During handling of the above exception, another exception occurred:
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_missing_dict_key>
-init_state = {'state': {}}, error_regex = 'Structure mismatch '
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "sequence_instead_of_mapping",
-            "init_state": [0.0],
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "mapping_instead_of_sequence",
-            "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "sequence_instead_of_variable",
-            "init_state": {"state": [[0.0]]},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "no_initial_state",
-            "init_state": None,
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "missing_dict_key",
-            "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
-        },
-        {
-            "testcase_name": "missing_variable_in_list",
-            "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
-        },
-    )
-    def test_state_mismatch_during_update(self, init_state, error_regex):
-        def jax_fn(params, state, inputs):
-            return inputs, {"state": [jnp.ones([])]}
-    
-        layer = JaxLayer(jax_fn, params={}, state=init_state)
->       with self.assertRaisesRegex(ValueError, error_regex):
-             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-E       AssertionError: "Structure mismatch " does not match "Expected dict, got DictWrapper({'state': DictWrapper({})})."
-
-keras/src/utils/jax_layer_test.py:712: AssertionError
-___ TestJaxLayer.test_state_mismatch_during_update_missing_variable_in_list ____
-ValueError: Expected dict, got DictWrapper({'state': DictWrapper({'foo': ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=2.0>])})}).
-
-During handling of the above exception, another exception occurred:
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_missing_variable_in_list>
-init_state = {'state': {'foo': [2.0]}}, error_regex = 'Structure mismatch'
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "sequence_instead_of_mapping",
-            "init_state": [0.0],
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "mapping_instead_of_sequence",
-            "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "sequence_instead_of_variable",
-            "init_state": {"state": [[0.0]]},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "no_initial_state",
-            "init_state": None,
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "missing_dict_key",
-            "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
-        },
-        {
-            "testcase_name": "missing_variable_in_list",
-            "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
-        },
-    )
-    def test_state_mismatch_during_update(self, init_state, error_regex):
-        def jax_fn(params, state, inputs):
-            return inputs, {"state": [jnp.ones([])]}
-    
-        layer = JaxLayer(jax_fn, params={}, state=init_state)
->       with self.assertRaisesRegex(ValueError, error_regex):
-             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-E       AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=2.0>])})})."
-
-keras/src/utils/jax_layer_test.py:712: AssertionError
-_______ TestJaxLayer.test_state_mismatch_during_update_no_initial_state ________
-ValueError: Expected dict, got None.
-
-During handling of the above exception, another exception occurred:
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_no_initial_state>
-init_state = None, error_regex = 'Structure mismatch'
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "sequence_instead_of_mapping",
-            "init_state": [0.0],
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "mapping_instead_of_sequence",
-            "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "sequence_instead_of_variable",
-            "init_state": {"state": [[0.0]]},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "no_initial_state",
-            "init_state": None,
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "missing_dict_key",
-            "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
-        },
-        {
-            "testcase_name": "missing_variable_in_list",
-            "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
-        },
-    )
-    def test_state_mismatch_during_update(self, init_state, error_regex):
-        def jax_fn(params, state, inputs):
-            return inputs, {"state": [jnp.ones([])]}
-    
-        layer = JaxLayer(jax_fn, params={}, state=init_state)
->       with self.assertRaisesRegex(ValueError, error_regex):
-             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-E       AssertionError: "Structure mismatch" does not match "Expected dict, got None."
-
-keras/src/utils/jax_layer_test.py:712: AssertionError
-__ TestJaxLayer.test_state_mismatch_during_update_sequence_instead_of_mapping __
-ValueError: Expected dict, got ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>]).
-
-During handling of the above exception, another exception occurred:
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_sequence_instead_of_mapping>
-init_state = [0.0], error_regex = 'Structure mismatch'
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "sequence_instead_of_mapping",
-            "init_state": [0.0],
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "mapping_instead_of_sequence",
-            "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "sequence_instead_of_variable",
-            "init_state": {"state": [[0.0]]},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "no_initial_state",
-            "init_state": None,
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "missing_dict_key",
-            "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
-        },
-        {
-            "testcase_name": "missing_variable_in_list",
-            "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
-        },
-    )
-    def test_state_mismatch_during_update(self, init_state, error_regex):
-        def jax_fn(params, state, inputs):
-            return inputs, {"state": [jnp.ones([])]}
-    
-        layer = JaxLayer(jax_fn, params={}, state=init_state)
->       with self.assertRaisesRegex(ValueError, error_regex):
-             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-E       AssertionError: "Structure mismatch" does not match "Expected dict, got ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])."
-
-keras/src/utils/jax_layer_test.py:712: AssertionError
-_ TestJaxLayer.test_state_mismatch_during_update_sequence_instead_of_variable __
-ValueError: Expected dict, got DictWrapper({'state': ListWrapper([ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])])}).
-
-During handling of the above exception, another exception occurred:
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_state_mismatch_during_update_sequence_instead_of_variable>
-init_state = {'state': [[0.0]]}, error_regex = 'Structure mismatch'
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "sequence_instead_of_mapping",
-            "init_state": [0.0],
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "mapping_instead_of_sequence",
-            "init_state": {"state": {"foo": 0.0}},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "sequence_instead_of_variable",
-            "init_state": {"state": [[0.0]]},
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "no_initial_state",
-            "init_state": None,
-            "error_regex": "Structure mismatch",
-        },
-        {
-            "testcase_name": "missing_dict_key",
-            "init_state": {"state": {}},
-            "error_regex": "Structure mismatch ",
-        },
-        {
-            "testcase_name": "missing_variable_in_list",
-            "init_state": {"state": {"foo": [2.0]}},
-            "error_regex": "Structure mismatch",
-        },
-    )
-    def test_state_mismatch_during_update(self, init_state, error_regex):
-        def jax_fn(params, state, inputs):
-            return inputs, {"state": [jnp.ones([])]}
-    
-        layer = JaxLayer(jax_fn, params={}, state=init_state)
->       with self.assertRaisesRegex(ValueError, error_regex):
-             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-E       AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': ListWrapper([ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])])})."
-
-keras/src/utils/jax_layer_test.py:712: AssertionError
-_______________ TestJaxLayer.test_with_different_argument_order ________________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_different_argument_order>
-
-    def test_with_different_argument_order(self):
-        def jax_call_fn(training, inputs, rng, state, params):
-            return inputs, {}
-    
-        def jax_init_fn(training, inputs, rng):
-            return {}, {}
-    
-        layer = JaxLayer(jax_call_fn, jax_init_fn)
->       layer(np.ones((1,)))
-
-keras/src/utils/jax_layer_test.py:532: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:614: in call
-    return call_with_fn(self.jax2tf_training_false_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x393b49940>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
-_________________ TestJaxLayer.test_with_flax_state_no_params __________________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_flax_state_no_params>
-
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_with_flax_state_no_params(self):
-        class MyFlaxLayer(flax.linen.Module):
-            @flax.linen.compact
-            def __call__(self, x):
-                def zeros_init(shape):
-                    return jnp.zeros(shape, jnp.int32)
-    
-                count = self.variable("a", "b", zeros_init, [])
-                count.value = count.value + 1
-                return x
-    
-        layer = FlaxLayer(MyFlaxLayer(), variables={"a": {"b": 0}})
->       layer(np.ones((1,)))
-
-keras/src/utils/jax_layer_test.py:634: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:609: in call
-    return call_with_fn(self.jax2tf_training_false_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x393b7aa20>
-tree = {'a': {'b': <tf.Tensor: shape=(), dtype=int32, numpy=1>}}, is_leaf = None
-rest = (DictWrapper({'a': DictWrapper({'b': <Variable path=flax_layer/variable, shape=(), dtype=int64, value=0>})}),)
-leaves = [<tf.Tensor: shape=(), dtype=int32, numpy=1>]
-treedef = PyTreeDef({'a': {'b': *}})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({'a': DictWrapper({'b': <Variable path=flax_layer/variable, shape=(), dtype=int64, value=0>})}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
-____________ TestJaxLayer.test_with_state_jax_registered_node_class ____________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_state_jax_registered_node_class>
-
-    def test_with_state_jax_registered_node_class(self):
-        @jax.tree_util.register_pytree_node_class
-        class NamedPoint:
-            def __init__(self, x, y, name):
-                self.x = x
-                self.y = y
-                self.name = name
-    
-            def tree_flatten(self):
-                return ((self.x, self.y), self.name)
-    
-            @classmethod
-            def tree_unflatten(cls, aux_data, children):
-                return cls(*children, aux_data)
-    
-        def jax_fn(params, state, inputs):
-            return inputs, state
-    
-        layer = JaxLayer(jax_fn, state=[NamedPoint(1.0, 2.0, "foo")])
->       layer(np.ones((1,)))
-
-keras/src/utils/jax_layer_test.py:673: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:609: in call
-    return call_with_fn(self.jax2tf_training_false_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x395be4680>
-tree = [<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x396832d50>]
-is_leaf = None
-rest = (ListWrapper([<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x3923390a0>]),)
-leaves = [<tf.Tensor: shape=(), dtype=float32, numpy=1.0>, <tf.Tensor: shape=(), dtype=float32, numpy=2.0>]
-treedef = PyTreeDef([CustomNode(NamedPoint[foo], [*, *])])
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected list, got ListWrapper([<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x3923390a0>]).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
-__________ TestJaxLayer.test_with_training_in_call_fn_but_not_init_fn __________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_with_training_in_call_fn_but_not_init_fn>
-
-    def test_with_training_in_call_fn_but_not_init_fn(self):
-        def jax_call_fn(params, state, rng, inputs, training):
-            return inputs, {}
-    
-        def jax_init_fn(rng, inputs):
-            return {}, {}
-    
-        layer = JaxLayer(jax_call_fn, jax_init_fn)
->       layer(np.ones((1,)))
-
-keras/src/utils/jax_layer_test.py:522: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:614: in call
-    return call_with_fn(self.jax2tf_training_false_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x395b993a0>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
-=========================== short test summary info ============================
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method - ValueError: Expected dict, got DictWrapper({}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_state_no_method - ValueError: Expected dict, got DictWrapper({'batch_stats': DictWrapper({'BatchNorm_0': DictWrapper({'mean': <Variable path=flax_layer/variable_13, shape=(12,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_14, shape=(12,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_1': DictWrapper({'mean': <Variable path=flax_layer/variable_15, shape=(24,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_16, shape=(24,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_2': DictWrapper({'mean': <Variable path=flax_layer/variable_17, shape=(32,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_18, shape=(32,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1.]>}), 'BatchNorm_3': DictWrapper({'mean': <Variable path=flax_layer/variable_19, shape=(200,), dtype=float32, value=[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
- 0. 0. 0. 0. 0. 0. 0. 0.]>, 'var': <Variable path=flax_layer/variable_20, shape=(200,), dtype=float32, value=[1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
- 1. 1. 1. 1. 1. 1. 1. 1.]>})})}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method - ValueError: Expected dict, got DictWrapper({}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method_dtype_policy - ValueError: Expected dict, got DictWrapper({}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_mapping_instead_of_sequence - AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': <Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>})})."
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_dict_key - AssertionError: "Structure mismatch " does not match "Expected dict, got DictWrapper({'state': DictWrapper({})})."
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_missing_variable_in_list - AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': DictWrapper({'foo': ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=2.0>])})})."
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_no_initial_state - AssertionError: "Structure mismatch" does not match "Expected dict, got None."
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_mapping - AssertionError: "Structure mismatch" does not match "Expected dict, got ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])."
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_state_mismatch_during_update_sequence_instead_of_variable - AssertionError: "Structure mismatch" does not match "Expected dict, got DictWrapper({'state': ListWrapper([ListWrapper([<Variable path=jax_layer/variable, shape=(), dtype=float32, value=0.0>])])})."
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_different_argument_order - ValueError: Expected dict, got DictWrapper({}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_flax_state_no_params - ValueError: Expected dict, got DictWrapper({'a': DictWrapper({'b': <Variable path=flax_layer/variable, shape=(), dtype=int64, value=0>})}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_jax_registered_node_class - ValueError: Expected list, got ListWrapper([<keras.src.utils.jax_layer_test.TestJaxLayer.test_with_state_jax_registered_node_class.<locals>.NamedPoint object at 0x3923390a0>]).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_training_in_call_fn_but_not_init_fn - ValueError: Expected dict, got DictWrapper({}).
-======================== 14 failed, 14 passed in 8.05s =========================
-============================= test session starts ==============================
-platform darwin -- Python 3.12.10, pytest-8.4.2, pluggy-1.6.0 -- /Users/wenyiguo/keras/venv/bin/python3.12
-cachedir: .pytest_cache
-rootdir: /Users/wenyiguo/keras
-configfile: pyproject.toml
-plugins: cov-7.0.0
-collecting ... collected 2 items
-
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method FAILED [ 50%]
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method FAILED [100%]
-
-=================================== FAILURES ===================================
-________ TestJaxLayer.test_flax_layer_training_independent_bound_method ________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_independent_bound_method>
-flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxTrainingIndependentModel'>
-flax_model_method = 'forward', init_kwargs = {}, trainable_weights = 8
-trainable_params = 648226, non_trainable_weights = 0, non_trainable_params = 0
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent_bound_method",
-            "flax_model_class": "FlaxTrainingIndependentModel",
-            "flax_model_method": "forward",
-            "init_kwargs": {},
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        # {
-        #     "testcase_name": "training_rng_state_no_method",
-        #     "flax_model_class": "FlaxBatchNormModel",
-        #     "flax_model_method": None,
-        #     "init_kwargs": {},
-        #     "trainable_weights": 13,
-        #     "trainable_params": 354258,
-        #     "non_trainable_weights": 8,
-        #     "non_trainable_params": 536,
-        # },
-        # {
-        #     "testcase_name": "training_rng_unbound_method_dtype_policy",
-        #     "flax_model_class": "FlaxDropoutModel",
-        #     "flax_model_method": None,
-        #     "init_kwargs": {
-        #         "method": "flax_dropout_wrapper",
-        #         "dtype": DTypePolicy("mixed_float16"),
-        #     },
-        #     "trainable_weights": 8,
-        #     "trainable_params": 648226,
-        #     "non_trainable_weights": 0,
-        #     "non_trainable_params": 0,
-        # },
-    )
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_flax_layer(
-        self,
-        flax_model_class,
-        flax_model_method,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
-        if "method" in init_kwargs:
-            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
-    
-        def create_wrapper(**kwargs):
-            params = kwargs.pop("params") if "params" in kwargs else None
-            state = kwargs.pop("state") if "state" in kwargs else None
-            if params and state:
-                variables = {**params, **state}
-            elif params:
-                variables = params
-            elif state:
-                variables = state
-            else:
-                variables = None
-            kwargs["variables"] = variables
-            flax_model = flax_model_class()
-            if flax_model_method:
-                kwargs["method"] = getattr(flax_model, flax_model_method)
-            if backend.backend() == "jax":
-                return FlaxLayer(flax_model_class(), **kwargs)
-            elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-    
-    
->       self._test_layer(
-            flax_model_class.__name__,
-            create_wrapper,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
-
-keras/src/utils/jax_layer_test.py:497: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/jax_layer_test.py:254: in _test_layer
-    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:399: in fit
-    logs = self.train_function(iterator)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:241: in function
-    opt_outputs = multi_step_on_iterator(iterator)
-                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
-    one_step_on_data(iterator.get_next())
-keras/src/backend/tensorflow/trainer.py:125: in wrapper
-    result = step_func(converted_data)
-             ^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
-    outputs = self.distribute_strategy.run(step_function, args=(data,))
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
-    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
-    return self._call_for_each_replica(fn, args, kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:59: in train_step
-    y_pred = self(x, training=True)
-             ^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:183: in call
-    outputs = self._run_through_graph(
-keras/src/ops/function.py:206: in _run_through_graph
-    outputs = op(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:644: in call
-    return operation(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:609: in call
-    return call_with_fn(self.jax2tf_training_false_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x31d82f740>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
------------------------------ Captured stdout call -----------------------------
-Model: "FlaxTrainingIndependentModel1"
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
-┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
-│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
-├─────────────────────────────────┼────────────────────────┼───────────────┤
-│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
-└─────────────────────────────────┴────────────────────────┴───────────────┘
- Total params: 648,226 (2.47 MB)
- Trainable params: 648,226 (2.47 MB)
- Non-trainable params: 0 (0.00 B)
------------------------------ Captured stderr call -----------------------------
-WARNING: All log messages before absl::InitializeLog() is called are written to STDERR
-I0000 00:00:1762560267.960370 1451585 service.cc:148] XLA service 0x15533c0f0 initialized for platform Host (this does not guarantee that XLA will be used). Devices:
-I0000 00:00:1762560267.960444 1451585 service.cc:156]   StreamExecutor device (0): Host, Default Version
-I0000 00:00:1762560267.986555 1451585 device_compiler.h:188] Compiled cluster using XLA!  This line is logged at most once for the lifetime of the process.
-___________ TestJaxLayer.test_flax_layer_training_rng_unbound_method ___________
-
-self = <keras.src.utils.jax_layer_test.TestJaxLayer testMethod=test_flax_layer_training_rng_unbound_method>
-flax_model_class = <class 'keras.src.utils.jax_layer_test.FlaxDropoutModel'>
-flax_model_method = None
-init_kwargs = {'method': <function flax_dropout_wrapper at 0x1549f8900>}
-trainable_weights = 8, trainable_params = 648226, non_trainable_weights = 0
-non_trainable_params = 0
-
-    @parameterized.named_parameters(
-        {
-            "testcase_name": "training_independent_bound_method",
-            "flax_model_class": "FlaxTrainingIndependentModel",
-            "flax_model_method": "forward",
-            "init_kwargs": {},
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        {
-            "testcase_name": "training_rng_unbound_method",
-            "flax_model_class": "FlaxDropoutModel",
-            "flax_model_method": None,
-            "init_kwargs": {
-                "method": "flax_dropout_wrapper",
-            },
-            "trainable_weights": 8,
-            "trainable_params": 648226,
-            "non_trainable_weights": 0,
-            "non_trainable_params": 0,
-        },
-        # {
-        #     "testcase_name": "training_rng_state_no_method",
-        #     "flax_model_class": "FlaxBatchNormModel",
-        #     "flax_model_method": None,
-        #     "init_kwargs": {},
-        #     "trainable_weights": 13,
-        #     "trainable_params": 354258,
-        #     "non_trainable_weights": 8,
-        #     "non_trainable_params": 536,
-        # },
-        # {
-        #     "testcase_name": "training_rng_unbound_method_dtype_policy",
-        #     "flax_model_class": "FlaxDropoutModel",
-        #     "flax_model_method": None,
-        #     "init_kwargs": {
-        #         "method": "flax_dropout_wrapper",
-        #         "dtype": DTypePolicy("mixed_float16"),
-        #     },
-        #     "trainable_weights": 8,
-        #     "trainable_params": 648226,
-        #     "non_trainable_weights": 0,
-        #     "non_trainable_params": 0,
-        # },
-    )
-    @pytest.mark.skipif(flax is None, reason="Flax library is not available.")
-    def test_flax_layer(
-        self,
-        flax_model_class,
-        flax_model_method,
-        init_kwargs,
-        trainable_weights,
-        trainable_params,
-        non_trainable_weights,
-        non_trainable_params,
-    ):
-        flax_model_class = FLAX_OBJECTS.get(flax_model_class)
-        if "method" in init_kwargs:
-            init_kwargs["method"] = FLAX_OBJECTS.get(init_kwargs["method"])
-    
-        def create_wrapper(**kwargs):
-            params = kwargs.pop("params") if "params" in kwargs else None
-            state = kwargs.pop("state") if "state" in kwargs else None
-            if params and state:
-                variables = {**params, **state}
-            elif params:
-                variables = params
-            elif state:
-                variables = state
-            else:
-                variables = None
-            kwargs["variables"] = variables
-            flax_model = flax_model_class()
-            if flax_model_method:
-                kwargs["method"] = getattr(flax_model, flax_model_method)
-            if backend.backend() == "jax":
-                return FlaxLayer(flax_model_class(), **kwargs)
-            elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-    
-    
->       self._test_layer(
-            flax_model_class.__name__,
-            create_wrapper,
-            init_kwargs,
-            trainable_weights,
-            trainable_params,
-            non_trainable_weights,
-            non_trainable_params,
-        )
-
-keras/src/utils/jax_layer_test.py:497: 
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-keras/src/utils/jax_layer_test.py:254: in _test_layer
-    model1.fit(x_train, y_train, epochs=1, steps_per_epoch=10)
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:399: in fit
-    logs = self.train_function(iterator)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:241: in function
-    opt_outputs = multi_step_on_iterator(iterator)
-                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:154: in multi_step_on_iterator
-    one_step_on_data(iterator.get_next())
-keras/src/backend/tensorflow/trainer.py:125: in wrapper
-    result = step_func(converted_data)
-             ^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:134: in one_step_on_data
-    outputs = self.distribute_strategy.run(step_function, args=(data,))
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:1673: in run
-    return self._extended.call_for_each_replica(fn, args=args, kwargs=kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:3263: in call_for_each_replica
-    return self._call_for_each_replica(fn, args, kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/distribute/distribute_lib.py:4061: in _call_for_each_replica
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-venv/lib/python3.12/site-packages/tensorflow/python/autograph/impl/api.py:643: in wrapper
-    return func(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^
-keras/src/backend/tensorflow/trainer.py:59: in train_step
-    y_pred = self(x, training=True)
-             ^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:183: in call
-    outputs = self._run_through_graph(
-keras/src/ops/function.py:206: in _run_through_graph
-    outputs = op(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^
-keras/src/models/functional.py:644: in call
-    return operation(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/layers/layer.py:941: in __call__
-    outputs = super().__call__(*args, **kwargs)
-              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/traceback_utils.py:113: in error_handler
-    return fn(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^
-keras/src/ops/operation.py:77: in __call__
-    return self.call(*args, **kwargs)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:612: in call
-    return call_with_fn(self.jax2tf_training_true_fn)
-           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
-keras/src/utils/jax_layer.py:586: in call_with_fn
-    jax.tree_util.tree_map(
-_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
-
-f = <function JaxLayer.call.<locals>.assign_state_to_variable at 0x323642de0>
-tree = {}, is_leaf = None, rest = (DictWrapper({}),), leaves = []
-treedef = PyTreeDef({})
-
-    @export
-    def tree_map(f: Callable[..., Any],
-                 tree: Any,
-                 *rest: Any,
-                 is_leaf: Callable[[Any], bool] | None = None) -> Any:
-      """Alias of :func:`jax.tree.map`."""
-      leaves, treedef = tree_flatten(tree, is_leaf)
->     all_leaves = [leaves] + [treedef.flatten_up_to(r) for r in rest]
-                               ^^^^^^^^^^^^^^^^^^^^^^^^
-E     ValueError: Expected dict, got DictWrapper({}).
-
-venv/lib/python3.12/site-packages/jax/_src/tree_util.py:357: ValueError
------------------------------ Captured stdout call -----------------------------
-Model: "FlaxDropoutModel1"
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
-┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
-│ input_layer (InputLayer)        │ (None, 28, 28, 1)      │             0 │
-├─────────────────────────────────┼────────────────────────┼───────────────┤
-│ flax_layer (FlaxLayer)          │ (None, 10)             │       648,226 │
-└─────────────────────────────────┴────────────────────────┴───────────────┘
- Total params: 648,226 (2.47 MB)
- Trainable params: 648,226 (2.47 MB)
- Non-trainable params: 0 (0.00 B)
-=========================== short test summary info ============================
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_independent_bound_method - ValueError: Expected dict, got DictWrapper({}).
-FAILED keras/src/utils/jax_layer_test.py::TestJaxLayer::test_flax_layer_training_rng_unbound_method - ValueError: Expected dict, got DictWrapper({}).
-============================== 2 failed in 1.45s ===============================
diff --git a/output.txt b/output.txt
deleted file mode 100644
index 6960ce8c14cb..000000000000
--- a/output.txt
+++ /dev/null
@@ -1,17 +0,0 @@
-============================= test session starts ==============================
-platform darwin -- Python 3.12.10, pytest-8.4.2, pluggy-1.6.0 -- /Users/wenyiguo/keras/venv/bin/python3.12
-cachedir: .pytest_cache
-rootdir: /Users/wenyiguo/keras
-configfile: pyproject.toml
-plugins: cov-7.0.0
-collecting ... collected 25 items / 24 deselected / 1 selected
-
-keras/src/utils/jax_layer_test.py::TestJaxLayer::test_with_state_none_leaves 
-self.state: {'foo': None}
-new_state: {'foo': None}
-self.state after:  {'foo': None}
-pytree name _DictWrapper
-pytree name _DictWrapper
-PASSED
-
-======================= 1 passed, 24 deselected in 0.10s =======================

From 015dd6b647b87312218737c2bf991e142cab6e75 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Sat, 8 Nov 2025 02:11:50 -0800
Subject: [PATCH 10/12] fix jax2tf import

---
 keras/src/utils/jax_layer.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index 7a9cb9524556..03c1742b145a 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -18,12 +18,9 @@
 from keras.src.utils import tracking
 from keras.src import ops
 from keras.src.utils.module_utils import jax
-from jax.experimental import jax2tf 
 from keras.src.utils.module_utils import tensorflow as tf
 
 
-
-
 def standardize_pytree_collections(pytree):
     if isinstance(pytree, collections.abc.Mapping):
         return {k: standardize_pytree_collections(v)
@@ -349,6 +346,8 @@ def get_single_jax2tf_shape(shape):
         return res
 
     def _jax2tf_convert(self, fn, polymorphic_shapes):
+        from jax.experimental import jax2tf
+
         converted_fn = jax2tf.convert(fn, polymorphic_shapes=polymorphic_shapes)
         # Autograph won't work with the output of jax2tf.
         converted_fn = tf.autograph.experimental.do_not_convert(converted_fn)

From 396a94e2c61ea9b464d785051422942e4cc26e48 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Sat, 8 Nov 2025 02:14:43 -0800
Subject: [PATCH 11/12] format

---
 keras/src/utils/jax_layer.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index 03c1742b145a..f16c3364c9e6 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -405,7 +405,11 @@ def create_variable(value):
                     dtype = None  # Use the layer dtype policy
                 return self.add_weight(
                     value.shape,
-                    initializer=backend.convert_to_tensor(value) if value is not None else None,
+                    initializer=(
+                        backend.convert_to_tensor(value)
+                        if value is not None
+                        else None
+                    ),
                     dtype=dtype,
                     trainable=trainable,
                 )

From 9d5d280548e7ace1c1addda6f3aeca04ff082eb7 Mon Sep 17 00:00:00 2001
From: wenyi-guo <wenyiguo@google.com>
Date: Mon, 10 Nov 2025 11:40:04 -0800
Subject: [PATCH 12/12] ruff format

---
 keras/src/utils/jax_layer.py      | 32 ++++++++++++++++---------------
 keras/src/utils/jax_layer_test.py |  7 ++++---
 2 files changed, 21 insertions(+), 18 deletions(-)

diff --git a/keras/src/utils/jax_layer.py b/keras/src/utils/jax_layer.py
index f16c3364c9e6..b117667ff81a 100644
--- a/keras/src/utils/jax_layer.py
+++ b/keras/src/utils/jax_layer.py
@@ -23,14 +23,13 @@
 
 def standardize_pytree_collections(pytree):
     if isinstance(pytree, collections.abc.Mapping):
-        return {k: standardize_pytree_collections(v)
-                for k, v in pytree.items()}
+        return {k: standardize_pytree_collections(v) for k, v in pytree.items()}
     elif isinstance(pytree, collections.abc.Sequence):
-        return [standardize_pytree_collections(v)
-                for v in pytree]
+        return [standardize_pytree_collections(v) for v in pytree]
     else:
         return pytree
 
+
 @keras_export("keras.layers.JaxLayer")
 class JaxLayer(Layer):
     """Keras Layer that wraps a JAX model.
@@ -275,12 +274,11 @@ def __init__(
             self.init_fn_arguments = self._validate_signature(
                 init_fn, "init_fn", {"rng", "inputs", "training"}, {"inputs"}
             )
-        
+
         # Attributes for jax2tf functions
         self.jax2tf_training_false_fn = None
         self.jax2tf_training_true_fn = None
 
-            
     def _validate_signature(self, fn, fn_name, allowed, required):
         fn_parameters = inspect.signature(fn).parameters
         for parameter_name in required:
@@ -300,7 +298,7 @@ def _validate_signature(self, fn, fn_name, allowed, required):
             parameter_names.append(parameter.name)
 
         return parameter_names
-    
+
     def _get_jax2tf_input_shape(self, input_shape):
         """Convert input shape in a format suitable for `jax2tf`.
 
@@ -480,14 +478,16 @@ def _initialize_weights(self, input_shape):
         if jax_utils.is_in_jax_tracing_scope() or tf.inside_function():
             # This exception is not actually shown, it is caught and a detailed
             # warning about calling 'build' is printed.
-            raise ValueError("'JaxLayer' cannot be built in tracing scope"
-                             "or inside tf function")
+            raise ValueError(
+                "'JaxLayer' cannot be built in tracing scope"
+                "or inside tf function"
+            )
 
         # Initialize `params` and `state` if needed by calling `init_fn`.
         def create_input(shape):
             shape = [d if d is not None else 1 for d in shape]
             return ops.ones(shape)
-        
+
         init_inputs = tree.map_shape_structure(create_input, input_shape)
         init_args = []
         for argument_name in self.init_fn_arguments:
@@ -509,7 +509,6 @@ def create_input(shape):
         )
         self.tracked_state = self._create_variables(init_state, trainable=False)
 
-                
     def build(self, input_shape):
         if self.params is None and self.state is None:
             self._initialize_weights(input_shape)
@@ -526,7 +525,9 @@ def build(self, input_shape):
                     polymorphic_shapes.append("...")
 
             if "training" in self.call_fn_arguments:
-                training_argument_index = self.call_fn_arguments.index("training")
+                training_argument_index = self.call_fn_arguments.index(
+                    "training"
+                )
                 self.jax2tf_training_false_fn = self._jax2tf_convert(
                     self._partial_with_positional(
                         self.call_fn, training_argument_index, False
@@ -546,7 +547,7 @@ def build(self, input_shape):
                 )
                 self.jax2tf_training_true_fn = None
             super().build(input_shape)
-    
+
     def call(self, inputs, training=False):
         def unwrap_variable(variable):
             return None if variable is None else variable.value
@@ -590,10 +591,12 @@ def call_with_fn(fn):
                     jax.tree_util.tree_map(
                         assign_state_to_variable,
                         standardize_pytree_collections(new_state),
-                        standardize_pytree_collections(self.state))
+                        standardize_pytree_collections(self.state),
+                    )
                 return predictions
             else:
                 return fn(*call_args)
+
         if backend.backend() == "jax":
             return call_with_fn(self.call_fn)
         elif backend.backend() == "tensorflow":
@@ -610,7 +613,6 @@ def compute_output_shape(self, input_shape):
             return self.compute_output_shape_fn(input_shape)
         else:
             return super().compute_output_shape(input_shape)
-    
 
     def get_config(self):
         config = {
diff --git a/keras/src/utils/jax_layer_test.py b/keras/src/utils/jax_layer_test.py
index 83774adcd00d..52fee536c659 100644
--- a/keras/src/utils/jax_layer_test.py
+++ b/keras/src/utils/jax_layer_test.py
@@ -204,7 +204,7 @@ def _test_layer(
         x_train = random.uniform(shape=(320, 28, 28, 1))
         y_train_indices = ops.cast(
             ops.random.uniform(shape=(320,), minval=0, maxval=num_classes),
-            dtype="int32"
+            dtype="int32",
         )
         y_train = ops.one_hot(y_train_indices, num_classes, dtype="int32")
         x_test = random.uniform(shape=(32, 28, 28, 1))
@@ -490,8 +490,9 @@ def create_wrapper(**kwargs):
             if backend.backend() == "jax":
                 return FlaxLayer(flax_model_class(), **kwargs)
             elif backend.backend() == "tensorflow":
-                return FlaxLayer(flax_model, stateless_compute_output_shape, **kwargs)
-
+                return FlaxLayer(
+                    flax_model, stateless_compute_output_shape, **kwargs
+                )
 
         self._test_layer(
             flax_model_class.__name__,