diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__init__.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..754923c9fea548cd2deaabe06a6dd158914a77ac --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__init__.py @@ -0,0 +1,16 @@ +# from keras.src.ops.numpy import Matmul, matmul +# from keras.src.ops.numpy import Add, add +# from keras.src.ops.numpy import Multiply, multiply + +from keras.src.backend import cast +from keras.src.backend import cond +from keras.src.backend import is_tensor +from keras.src.backend import name_scope +from keras.src.backend import random +from keras.src.ops import image +from keras.src.ops import operation_utils +from keras.src.ops.core import * # noqa: F403 +from keras.src.ops.linalg import * # noqa: F403 +from keras.src.ops.math import * # noqa: F403 +from keras.src.ops.nn import * # noqa: F403 +from keras.src.ops.numpy import * # noqa: F403 diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__pycache__/operation_utils.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__pycache__/operation_utils.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a8b771131a4f12784848d99149e365fcc153c50c Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__pycache__/operation_utils.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__pycache__/symbolic_arguments.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__pycache__/symbolic_arguments.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..c20e6d5f6cfd6f7cc407e669921f5af79f607db8 Binary files /dev/null and 
b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/__pycache__/symbolic_arguments.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/core.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/core.py new file mode 100644 index 0000000000000000000000000000000000000000..65fab8413425f17aa7560b1ae54f5f3a46c86050 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/core.py @@ -0,0 +1,1167 @@ +import ml_dtypes +import numpy as np + +from keras.src import backend +from keras.src import tree +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend import any_symbolic_tensors +from keras.src.backend.common.backend_utils import slice_along_axis +from keras.src.ops.operation import Operation +from keras.src.utils import traceback_utils + + +class Map(Operation): + def __init__(self): + super().__init__() + + def call(self, f, xs): + return backend.core.map(f, xs) + + def compute_output_spec(self, f, xs): + x = xs[0] + n = xs.shape[0] + y = backend.compute_output_spec(f, x) + + def append_batch_axis(x): + return KerasTensor( + shape=(n,) + x.shape, dtype=x.dtype, sparse=x.sparse + ) + + y = tree.map_structure(append_batch_axis, y) + return y + + +@keras_export("keras.ops.map") +def map(f, xs): + """Map a function over leading array axes. + + Like Python’s builtin map, except inputs and outputs are in the form of + stacked arrays. Consider using the `vectorized_map()` transform instead, + unless you need to apply a function element by element for reduced memory + usage or heterogeneous computation with other control flow primitives. 
+ + When `xs` is an array type, the semantics of `map()` are given by this + Python implementation: + + ```python + def map(f, xs): + return np.stack([f(x) for x in xs]) + ``` + + Args: + f: Callable defines the function to apply element-wise over the first + axis or axes of `xs`. + xs: Values over which to map along the leading axis. + + Returns: + Mapped values. + + Examples: + + >>> f = lambda x: x**2 + >>> xs = keras.ops.arange(10) + >>> ys = keras.ops.map(f, xs) + >>> ys + [0, 1, 4, 9, 16, 25, 36, 49, 64, 81] + + >>> f = lambda x: {"y1": x**2, "y2": x * 10} # Can have nested outputs + >>> ys = keras.ops.map(f, xs) + >>> ys["y1"] + [0, 1, 4, 9, 16, 25, 36, 49, 64, 81] + >>> ys["y2"] + [0, 10, 20, 30, 40, 50, 60, 70, 80, 90] + """ + if any_symbolic_tensors((xs,)): + return Map().symbolic_call(f, xs) + return backend.core.map(f, xs) + + +class Scan(Operation): + def __init__(self, reverse=False, unroll=1): + super().__init__() + self.reverse = reverse + self.unroll = unroll + + def call(self, f, init, xs, length): + return backend.core.scan( + f, init, xs, length, reverse=self.reverse, unroll=self.unroll + ) + + def compute_output_spec(self, f, init, xs, length): + if xs is None: + n = int(length) + x = None + else: + n = ( + int(length) + if length is not None + else tree.flatten(xs)[0].shape[0] + ) + x = xs[0] + + carry, y = backend.compute_output_spec(f, init, x) + y = KerasTensor(shape=(n,) + y.shape, dtype=y.dtype, sparse=y.sparse) + return carry, y + + +@keras_export("keras.ops.scan") +def scan(f, init, xs=None, length=None, reverse=False, unroll=1): + """Scan a function over leading array axes while carrying along state. 
+ + When the type of `xs` is an array type or `None`, and the type of `ys` is an + array type, the semantics of `scan()` are given roughly by this Python + implementation: + + ```python + def scan(f, init, xs, length=None): + if xs is None: + xs = [None] * length + carry = init + ys = [] + for x in xs: + carry, y = f(carry, x) + ys.append(y) + return carry, np.stack(ys) + ``` + + The loop-carried value `carry` (`init`) must hold a fixed shape and dtype + across all iterations. + + In TensorFlow, `y` must match `carry` in shape and dtype. This is not + required in other backends. + + Args: + f: Callable defines the logic for each loop iteration. This accepts two + arguments where the first is a value of the loop carry and the + second is a slice of `xs` along its leading axis. + This callable returns a pair where the first represents a new value + for the loop carry and the second represents a slice of the output. + init: The initial loop carry value. This can be a scalar, tensor, or any + nested structure. It must match the structure of the first element + returned by `f`. + xs: Optional value to scan along its leading axis. This can be a tensor + or any nested structure. If `xs` is not provided, you must specify + `length` to define the number of loop iterations. + Defaults to `None`. + length: Optional integer specifying the number of loop iterations. + If `length` is not provided, it defaults to the sizes of leading + axis of the arrays in `xs`. Defaults to `None`. + reverse: Optional boolean specifying whether to run the scan iteration + forward or in reverse, equivalent to reversing the leading axes of + the arrays in both `xs` and in `ys`. + unroll: Optional positive integer or boolean specifying how many scan + iterations to unroll within a single iteration of a loop. If an + integer is provided, it determines how many unrolled loop iterations + to run within a single rolled iteration of the loop. 
If a boolean is + provided, it will determine if the loop is completely unrolled + (`unroll=True`) or left completely unrolled (`unroll=False`). + Note that unrolling is only supported by JAX and TensorFlow + backends. + + Returns: + A pair where the first element represents the final loop carry value and + the second element represents the stacked outputs of `f` when scanned + over the leading axis of the inputs. + + Examples: + + >>> sum_fn = lambda c, x: (c + x, c + x) + >>> init = keras.ops.array(0) + >>> xs = keras.ops.array([1, 2, 3, 4, 5]) + >>> carry, result = keras.ops.scan(sum_fn, init, xs) + >>> carry + 15 + >>> result + [1, 3, 6, 10, 15] + """ + if any_symbolic_tensors((init, xs)): + return Scan(reverse=reverse, unroll=unroll).symbolic_call( + f, init, xs, length + ) + return backend.core.scan( + f, init, xs, length, reverse=reverse, unroll=unroll + ) + + +class AssociativeScan(Operation): + def __init__(self, reverse=False): + super().__init__() + self.reverse = reverse + + def call(self, f, elems, axis=0): + return backend.core.associative_scan( + f, elems, reverse=self.reverse, axis=axis + ) + + def compute_output_spec(self, f, elems, axis): + elems_flat = tree.flatten(elems) + lens = [elem.shape[axis] for elem in elems_flat] + if len(set(lens)) != 1: + raise ValueError( + "Array inputs to associative_scan must have the same " + "first dimension. (saw: {})".format( + [elem.shape for elem in elems_flat] + ) + ) + + x = tree.pack_sequence_as( + elems, [slice_along_axis(x, 0, 1, axis=axis) for x in elems_flat] + ) + y_spec = backend.compute_output_spec(f, x, x) + + def _restore_shape(x): + return KerasTensor( + shape=elems_flat[0].shape, dtype=x.dtype, sparse=x.sparse + ) + + y_spec = tree.map_structure(_restore_shape, y_spec) + return y_spec + + +@keras_export("keras.ops.associative_scan") +def associative_scan(f, elems, reverse=False, axis=0): + """Performs a scan with an associative binary operation, in parallel. 
+ + This operation his similar to `scan`, with the key difference that + `associative_scan` is a parallel implementation with + potentially significant performance benefits, especially when jit compiled. + The catch is that it can only be used when `f` is a binary associative + operation (i.e. it must verify `f(a, f(b, c)) == f(f(a, b), c)`). + + For an introduction to associative scans, refer to this paper: + Blelloch, Guy E. 1990. + [Prefix Sums and Their Applications]( + https://www.cs.cmu.edu/~guyb/papers/Ble93.pdf). + + Args: + f: A Python callable implementing an associative binary operation with + signature `r = f(a, b)`. Function `f` must be associative, i.e., + it must satisfy the equation + `f(a, f(b, c)) == f(f(a, b), c)`. + The inputs and result are (possibly nested Python tree structures + of) array(s) matching `elems`. Each array has a dimension in place + of the `axis` dimension. `f` should be applied elementwise over + the `axis` dimension. + The result `r` has the same shape (and structure) as the + two inputs `a` and `b`. + elems: A (possibly nested Python tree structure of) array(s), each with + an `axis` dimension of size `num_elems`. + reverse: A boolean stating if the scan should be reversed with respect + to the `axis` dimension. + axis: an integer identifying the axis over which the scan should occur. + + Returns: + A (possibly nested Python tree structure of) array(s) of the same shape + and structure as `elems`, in which the `k`'th element of `axis` is + the result of recursively applying `f` to combine the first `k` + elements of `elems` along `axis`. For example, given + `elems = [a, b, c, ...]`, the result would be + `[a, f(a, b), f(f(a, b), c), ...]`. 
+ + Examples: + + >>> sum_fn = lambda x, y: x + y + >>> xs = keras.ops.arange(5) + >>> ys = keras.ops.associative_scan(sum_fn, xs, axis=0) + >>> ys + [0, 1, 3, 6, 10] + + >>> sum_fn = lambda x, y: [x[0] + y[0], x[1] + y[1], x[2] + y[2]] + >>> xs = [keras.ops.array([[1, 2]]) for _ in range(3)] + >>> ys = keras.ops.associative_scan(sum_fn, xs, axis=0) + >>> ys + [[1, 3], [1, 3], [1, 3]] + """ + if any_symbolic_tensors((elems,)): + return AssociativeScan(reverse=reverse).symbolic_call(f, elems, axis) + return backend.core.associative_scan(f, elems, reverse=reverse, axis=axis) + + +class Scatter(Operation): + def call(self, indices, values, shape): + return backend.core.scatter(indices, values, shape) + + def compute_output_spec(self, indices, values, shape): + return KerasTensor(shape, dtype=values.dtype) + + +@keras_export("keras.ops.scatter") +def scatter(indices, values, shape): + """Returns a tensor of shape `shape` where `indices` are set to `values`. + + At a high level, this operation does `zeros[indices] = updates` and + returns the output. It is equivalent to: + + ```python + zeros = keras.ops.zeros(shape) + output = keras.ops.scatter_update(zeros, indices, values) + ``` + + Args: + indices: A tensor or list/tuple specifying + indices for the values in `values`. + values: A tensor, the values to be set at `indices`. + shape: Shape of the output tensor. 
+ + Example: + + >>> indices = [[0, 1], [1, 1]] + >>> values = np.array([1., 1.]) + >>> keras.ops.scatter(indices, values, shape=(2, 2)) + array([[0., 1.], + [0., 1.]]) + """ + if any_symbolic_tensors((indices, values, shape)): + return Scatter().symbolic_call(indices, values, shape) + return backend.core.scatter(indices, values, shape) + + +class ScatterUpdate(Operation): + def call(self, inputs, indices, updates): + return backend.core.scatter_update(inputs, indices, updates) + + def compute_output_spec(self, inputs, indices, updates): + return KerasTensor(inputs.shape, dtype=inputs.dtype) + + +@keras_export("keras.ops.scatter_update") +def scatter_update(inputs, indices, updates): + """Update inputs via updates at scattered (sparse) indices. + + At a high level, this operation does `inputs[indices] = updates`. + Assume `inputs` is a tensor of shape `(D0, D1, ..., Dn)`, there are 2 main + usages of `scatter_update`. + + 1. `indices` is a 2D tensor of shape `(num_updates, n)`, where `num_updates` + is the number of updates to perform, and `updates` is a 1D tensor of + shape `(num_updates,)`. For example, if `inputs` is `zeros((4, 4, 4))`, + and we want to update `inputs[1, 2, 3]` and `inputs[0, 1, 3]` as 1, then + we can use: + + ```python + inputs = np.zeros((4, 4, 4)) + indices = [[1, 2, 3], [0, 1, 3]] + updates = np.array([1., 1.]) + inputs = keras.ops.scatter_update(inputs, indices, updates) + ``` + + 2 `indices` is a 2D tensor of shape `(num_updates, k)`, where `num_updates` + is the number of updates to perform, and `k` (`k < n`) is the size of + each index in `indices`. `updates` is a `n - k`-D tensor of shape + `(num_updates, inputs.shape[k:])`. For example, if + `inputs = np.zeros((4, 4, 4))`, and we want to update `inputs[1, 2, :]` + and `inputs[2, 3, :]` as `[1, 1, 1, 1]`, then `indices` would have shape + `(num_updates, 2)` (`k = 2`), and `updates` would have shape + `(num_updates, 4)` (`inputs.shape[2:] = 4`). 
See the code below: + + ```python + inputs = np.zeros((4, 4, 4)) + indices = [[1, 2], [2, 3]] + updates = np.array([[1., 1., 1, 1,], [1., 1., 1, 1,]) + inputs = keras.ops.scatter_update(inputs, indices, updates) + ``` + + Args: + inputs: A tensor, the tensor to be updated. + indices: A tensor or list/tuple of shape `(N, inputs.ndim)`, specifying + indices to update. `N` is the number of indices to update, must be + equal to the first dimension of `updates`. + updates: A tensor, the new values to be put to `inputs` at `indices`. + + Returns: + A tensor, has the same shape and dtype as `inputs`. + """ + if any_symbolic_tensors((inputs, indices, updates)): + return ScatterUpdate().symbolic_call(inputs, indices, updates) + return backend.core.scatter_update(inputs, indices, updates) + + +class Slice(Operation): + def call(self, inputs, start_indices, shape): + return backend.core.slice(inputs, start_indices, shape) + + def compute_output_spec(self, inputs, start_indices, shape): + return KerasTensor(shape, dtype=inputs.dtype) + + +@keras_export("keras.ops.slice") +def slice(inputs, start_indices, shape): + """Return a slice of an input tensor. + + At a high level, this operation is an explicit replacement for array slicing + e.g. `inputs[start_indices: start_indices + shape]`. + Unlike slicing via brackets, this operation will accept tensor start + indices on all backends, which is useful when indices dynamically computed + via other tensor operations. + + ```python + inputs = np.zeros((5, 5)) + start_indices = np.array([3, 3]) + shape = np.array([2, 2]) + inputs = keras.ops.slice(inputs, start_indices, shape) + ``` + + Args: + inputs: A tensor, the tensor to be updated. + start_indices: A list/tuple of shape `(inputs.ndim,)`, specifying + the starting indices for updating. + shape: The full shape of the returned slice. + + Returns: + A tensor, has the same shape and dtype as `inputs`. 
+ """ + if any_symbolic_tensors((inputs, start_indices, shape)): + return Slice().symbolic_call(inputs, start_indices, shape) + return backend.core.slice(inputs, start_indices, shape) + + +class SliceUpdate(Operation): + def call(self, inputs, start_indices, updates): + return backend.core.slice_update(inputs, start_indices, updates) + + def compute_output_spec(self, inputs, start_indices, updates): + return KerasTensor(inputs.shape, dtype=inputs.dtype) + + +@keras_export("keras.ops.slice_update") +def slice_update(inputs, start_indices, updates): + """Update an input by slicing in a tensor of updated values. + + At a high level, this operation does + `inputs[start_indices: start_indices + updates.shape] = updates`. + Assume inputs is a tensor of shape `(D0, D1, ..., Dn)`, + `start_indices` must be a list/tuple of n integers, specifying the starting + indices. `updates` must have the same rank as `inputs`, and the size of each + dim must not exceed `Di - start_indices[i]`. For example, if we have 2D + inputs `inputs = np.zeros((5, 5))`, and we want to update the intersection + of last 2 rows and last 2 columns as 1, i.e., + `inputs[3:, 3:] = np.ones((2, 2))`, then we can use the code below: + + ```python + inputs = np.zeros((5, 5)) + start_indices = [3, 3] + updates = np.ones((2, 2)) + inputs = keras.ops.slice_update(inputs, start_indices, updates) + ``` + + Args: + inputs: A tensor, the tensor to be updated. + start_indices: A list/tuple of shape `(inputs.ndim,)`, specifying + the starting indices for updating. + updates: A tensor, the new values to be put to `inputs` at `indices`. + `updates` must have the same rank as `inputs`. + + Returns: + A tensor, has the same shape and dtype as `inputs`. 
+ """ + if any_symbolic_tensors((inputs, start_indices, updates)): + return SliceUpdate().symbolic_call(inputs, start_indices, updates) + return backend.core.slice_update(inputs, start_indices, updates) + + +class Switch(Operation): + def call(self, index, branches, *operands): + return backend.core.switch(index, branches, *operands) + + def compute_output_spec(self, index, branches, *operands): + # We use first branch for output_spec + spec = backend.compute_output_spec(branches[0], *operands) + return spec + + +@keras_export("keras.ops.switch") +def switch(index, branches, *operands): + """Apply exactly one of the `branches` given by `index`. + + If `index` is out of bounds, it is clamped to within bounds. + + The semantics of `switch` are given roughly by this Python implementation: + + ```python + def switch(index, branches, *operands): + index = clamp(0, index, len(branches) - 1) + return branches[index](*operands) + ``` + + Args: + index: An integer scalar indicating which branch function to apply. + branches: A sequence of functions to be applied based on `index`. + operands: Inputs to whichever branch is applied. + + Returns: + The outputs of `branch(*operands)` for the branch that was selected + based on `index`. 
+ + Examples: + + >>> add_fn = lambda x, y: x + y + >>> subtract_fn = lambda x, y: x - y + >>> x = keras.ops.array(2.0) + >>> y = keras.ops.array(0.5) + >>> branches = [add_fn, subtract_fn] + >>> keras.ops.switch(0, branches, x, y) + 2.5 + + >>> keras.ops.switch(1, branches, x, y) + 1.5 + """ + if any_symbolic_tensors(operands): + return Switch().symbolic_call(index, branches, *operands) + return backend.core.switch(index, branches, *operands) + + +class WhileLoop(Operation): + def __init__(self, cond, body, maximum_iterations): + super().__init__() + self.cond = cond + self.body = body + self.maximum_iterations = maximum_iterations + + def call(self, loop_vars): + return backend.core.while_loop( + self.cond, + self.body, + loop_vars, + maximum_iterations=self.maximum_iterations, + ) + + def compute_output_spec(self, loop_vars): + return [KerasTensor(v.shape, dtype=v.dtype) for v in loop_vars] + + +@keras_export("keras.ops.while_loop") +def while_loop( + cond, + body, + loop_vars, + maximum_iterations=None, +): + """While loop implementation. + + Args: + cond: A callable that represents the termination condition of the loop. + Must accept a `loop_vars` like structure as an argument. If + `loop_vars` is a tuple or list, each element of `loop_vars` will be + passed positionally to the callable. + body: A callable that represents the loop body. Must accept a + `loop_vars` like structure as an argument, and return update value + with the same structure. If `loop_vars` is a tuple or list, each + element of `loop_vars` will be passed positionally to the callable. + loop_vars: An arbitrary nested structure of tensor state to persist + across loop iterations. + maximum_iterations: Optional maximum number of iterations of the while + loop to run. If provided, the `cond` output is AND-ed with an + additional condition ensuring the number of iterations executed is + no greater than `maximum_iterations`. 
+ + Returns: + A list/tuple of tensors, has the same shape and dtype as `inputs`. + + Examples: + + >>> i = 0 + >>> cond = lambda i: i < 10 + >>> body = lambda i: i + 1 + >>> keras.ops.while_loop(cond, body, i) + 10 + + >>> x, y = 0, 1 + >>> cond = lambda x, y: x < 10 + >>> body = lambda x, y: (x + 1, y + 1) + >>> keras.ops.while_loop(cond, body, (x, y)) + 10, 11 + """ + return backend.core.while_loop( + cond, + body, + loop_vars, + maximum_iterations=maximum_iterations, + ) + + +class StopGradient(Operation): + def __init__(self): + super().__init__() + + def call(self, variable): + return backend.core.stop_gradient(variable) + + def compute_output_spec(self, variable): + return KerasTensor(variable.shape, dtype=variable.dtype) + + +@keras_export("keras.ops.stop_gradient") +def stop_gradient(variable): + """Stops gradient computation. + + Args: + variable: A tensor variable for which the gradient + computation is to be disabled. + + Returns: + The variable with gradient computation disabled. + + Examples: + + >>> var = keras.backend.convert_to_tensor( + ... [1., 2., 3.], + ... dtype="float32" + ... ) + >>> var = keras.ops.stop_gradient(var) + """ + if any_symbolic_tensors((variable,)): + return StopGradient().symbolic_call(variable) + return backend.core.stop_gradient(variable) + + +class ForiLoop(Operation): + def __init__(self, lower, upper, body_fun): + super().__init__() + self.lower = lower + self.upper = upper + self.body_fun = body_fun + + def call(self, init_val): + return backend.core.fori_loop( + self.lower, + self.upper, + self.body_fun, + init_val, + ) + + def compute_output_spec(self, init_val): + return KerasTensor(init_val.shape, dtype=init_val.dtype) + + +@keras_export("keras.ops.fori_loop") +def fori_loop(lower, upper, body_fun, init_val): + """For loop implementation. + + Args: + lower: The initial value of the loop variable. + upper: The upper bound of the loop variable. + body_fun: A callable that represents the loop body. 
Must take two + arguments: the loop variable and the loop state. The loop state + should be updated and returned by this function. + init_val: The initial value of the loop state. + + Returns: + The final state after the loop. + + Example: + + >>> lower = 0 + >>> upper = 10 + >>> body_fun = lambda i, s: (i + 1, s + i) + >>> init_val = 0 + >>> keras.ops.fori_loop(lower, upper, body_fun, init_val) + 45 + """ + if any_symbolic_tensors((lower, upper, init_val)): + return ForiLoop(lower, upper, body_fun).symbolic_call(init_val) + return backend.core.fori_loop(lower, upper, body_fun, init_val) + + +class Unstack(Operation): + def __init__(self, num=None, axis=0): + super().__init__() + self.num = num + self.axis = axis + + def call(self, x): + return backend.core.unstack(x, self.num, self.axis) + + def compute_output_spec(self, x): + axis = self.axis + if axis < 0: + axis = len(x.shape) + axis + output_shapes = x.shape[:axis] + x.shape[axis + 1 :] + num = self.num + if num is None: + num = x.shape[axis] + if num is None: + raise ValueError( + "Cannot infer argument `num` from shape " + f"{x.shape}. Either provide a tensor with a " + "concrete shape in the `axis` dimension or " + "explicitly pass the `num` argument." + ) + output = [ + KerasTensor(shape=output_shapes, dtype=x.dtype) for _ in range(num) + ] + return output + + +@keras_export("keras.ops.unstack") +def unstack(x, num=None, axis=0): + """Unpacks the given dimension of a rank-R tensor into rank-(R-1) tensors. + + Args: + x: The input tensor. + num: The length of the dimension axis. Automatically inferred + if `None`. + axis: The axis along which to unpack. + + Returns: + A list of tensors unpacked along the given axis. 
+ + Example: + + >>> x = keras.ops.array([[1, 2], [3, 4]]) + >>> keras.ops.unstack(x, axis=0) + [array([1, 2]), array([3, 4])] + """ + if any_symbolic_tensors((x,)): + return Unstack(num, axis).symbolic_call(x) + return backend.core.unstack(x, num=num, axis=axis) + + +@keras_export("keras.ops.shape") +def shape(x): + """Gets the shape of the tensor input. + + Note: On the TensorFlow backend, when `x` is a `tf.Tensor` with dynamic + shape, dimensions which are dynamic in the context of a compiled function + will have a `tf.Tensor` value instead of a static integer value. + + Args: + x: A tensor. This function will try to access the `shape` attribute of + the input tensor. + + Returns: + A tuple of integers or None values, indicating the shape of the input + tensor. + + Example: + + >>> x = keras.ops.zeros((8, 12)) + >>> keras.ops.shape(x) + (8, 12) + """ + if any_symbolic_tensors((x,)): + return x.shape + return backend.core.shape(x) + + +@keras_export("keras.ops.dtype") +def dtype(x): + """Return the dtype of the tensor input as a standardized string. + + Note that due to the standardization, the dtype will not compare equal + to the backend-specific version of the dtype. + + Args: + x: A tensor. This function will try to access the `dtype` attribute of + the input tensor. + + Returns: + A string indicating the dtype of the input tensor, e.g. `"float32"`. + + Example: + + >>> x = keras.ops.zeros((8, 12)) + >>> keras.ops.dtype(x) + 'float32' + + """ + return backend.standardize_dtype(x.dtype) + + +class Cast(Operation): + def __init__(self, dtype): + super().__init__() + self.dtype = backend.standardize_dtype(dtype) + + def call(self, x): + return backend.core.cast(x, self.dtype) + + def compute_output_spec(self, x): + return backend.KerasTensor(shape=x.shape, dtype=self.dtype) + + +@keras_export("keras.ops.cast") +def cast(x, dtype): + """Cast a tensor to the desired dtype. + + Args: + x: A tensor or variable. + dtype: The target type. 
+ + Returns: + A tensor of the specified `dtype`. + + Example: + + >>> x = keras.ops.arange(4) + >>> x = keras.ops.cast(x, dtype="float16") + """ + dtype = backend.standardize_dtype(dtype) + + if any_symbolic_tensors((x,)): + return Cast(dtype=dtype)(x) + return backend.core.cast(x, dtype) + + +class SaturateCast(Operation): + def __init__(self, dtype): + super().__init__() + self.dtype = backend.standardize_dtype(dtype) + + def call(self, x): + return _saturate_cast(x, self.dtype) + + def compute_output_spec(self, x): + return backend.KerasTensor(shape=x.shape, dtype=self.dtype) + + +@keras_export("keras.ops.saturate_cast") +def saturate_cast(x, dtype): + """Performs a safe saturating cast to the desired dtype. + + Saturating cast prevents data type overflow when casting to `dtype` with + smaller values range. E.g. + `ops.cast(ops.cast([-1, 256], "float32"), "uint8")` returns `[255, 0]`, + but `ops.saturate_cast(ops.cast([-1, 256], "float32"), "uint8")` returns + `[0, 255]`. + + Args: + x: A tensor or variable. + dtype: The target type. + + Returns: + A safely casted tensor of the specified `dtype`. + + Example: + + Image resizing with bicubic interpolation may produce values outside + original range. + >>> image2x2 = np.array([0, 1, 254, 255], dtype="uint8").reshape(1, 2, 2, 1) + >>> image4x4 = tf.image.resize(image2x2, (4, 4), method="bicubic") + >>> print(image4x4.numpy().squeeze()) + >>> # [[-22.500004 -22.204624 -21.618908 -21.32353 ] + >>> # [ 52.526054 52.82143 53.407146 53.70253 ] + >>> # [201.29752 201.59288 202.17859 202.47395 ] + >>> # [276.32355 276.61893 277.20465 277.50006 ]] + + Casting this resized image back to `uint8` will cause overflow. + >>> image4x4_casted = ops.cast(image4x4, "uint8") + >>> print(image4x4_casted.numpy().squeeze()) + >>> # [[234 234 235 235] + >>> # [ 52 52 53 53] + >>> # [201 201 202 202] + >>> # [ 20 20 21 21]] + + Saturate casting to `uint8` will clip values to `uint8` range before + casting and will not cause overflow. 
+ >>> image4x4_saturate_casted = ops.saturate_cast(image4x4, "uint8") + >>> print(image4x4_saturate_casted.numpy().squeeze()) + >>> # [[ 0 0 0 0] + >>> # [ 52 52 53 53] + >>> # [201 201 202 202] + >>> # [255 255 255 255]] + + """ + dtype = backend.standardize_dtype(dtype) + + if any_symbolic_tensors((x,)): + return SaturateCast(dtype=dtype)(x) + return _saturate_cast(x, dtype) + + +def _saturate_cast(x, dtype, backend_module=None): + backend_module = backend_module or backend + + def get_dtype_min_max(dtype): + if "bool" == dtype: + dtype_min = 0 + dtype_max = 1 + elif "int" in dtype: + dtype_min = ml_dtypes.iinfo(dtype).min + dtype_max = ml_dtypes.iinfo(dtype).max + else: + dtype_min = ml_dtypes.finfo(dtype).min + dtype_max = ml_dtypes.finfo(dtype).max + return dtype_min, dtype_max + + dtype = backend.standardize_dtype(dtype) + in_dtype = backend.standardize_dtype(x.dtype) + in_min, in_max = get_dtype_min_max(in_dtype) + out_min, out_max = get_dtype_min_max(dtype) + + # The output min/max may not actually be representable in the + # in_dtype (e.g. casting float32 to uint32). This can lead to undefined + # behavior when trying to cast a value outside the valid range of the + # target type. We work around this by nudging the min/max to fall within + # the valid output range. The catch is that we may actually saturate + # to a value less than the true saturation limit, but this is the best we + # can do in order to avoid UB without backend op. + min_limit = np.maximum(in_min, out_min).astype(in_dtype) + if min_limit < out_min: + min_limit = np.nextafter(min_limit, 0, dtype=in_dtype) + max_limit = np.minimum(in_max, out_max).astype(in_dtype) + if max_limit > out_max: + max_limit = np.nextafter(max_limit, 0, dtype=in_dtype) + + # Unconditionally apply `clip` to fix `inf` behavior. 
+ x = backend_module.numpy.clip(x, min_limit, max_limit) + + return backend_module.cast(x, dtype) + + +class ConvertToTensor(Operation): + def __init__(self, dtype, sparse): + super().__init__() + self.dtype = backend.standardize_dtype(dtype) + self.sparse = sparse + + def call(self, x): + return backend.core.convert_to_tensor( + x, dtype=self.dtype, sparse=self.sparse + ) + + def compute_output_spec(self, x): + dtype = x.dtype if self.dtype is None else self.dtype + sparse = ( + False if self.sparse is not None and not self.sparse else x.sparse + ) + return backend.KerasTensor(shape=x.shape, dtype=dtype, sparse=sparse) + + +@keras_export("keras.ops.convert_to_tensor") +def convert_to_tensor(x, dtype=None, sparse=None): + """Convert a NumPy array to a tensor. + + Args: + x: A NumPy array, Python array (can be nested) or a backend tensor. + dtype: The target type. If `None`, the type of `x` is used. + sparse: Whether to keep sparse tensors. `False` will cause sparse + tensors to be densified. The default value of `None` means that + sparse tensors are kept only if the backend supports them. + + Returns: + A backend tensor of the specified `dtype` and sparseness. + + Example: + + >>> x = np.array([1, 2, 3]) + >>> y = keras.ops.convert_to_tensor(x) + """ + if any_symbolic_tensors((x,)): + return ConvertToTensor(dtype=dtype, sparse=sparse)(x) + return backend.core.convert_to_tensor(x, dtype=dtype, sparse=sparse) + + +@keras_export("keras.ops.convert_to_numpy") +def convert_to_numpy(x): + """Convert a tensor to a NumPy array. + + Args: + x: A tensor. + + Returns: + A NumPy array. + """ + if any_symbolic_tensors((x,)): + # This will raise a `ValueError` defined in the `KerasTensor` class. + # We trigger it rather than duplicate it here. 
+ return np.array(x) + return backend.convert_to_numpy(x) + + +class Cond(Operation): + @traceback_utils.filter_traceback + def __call__(self, *args, **kwargs): + def call_fn(*args, **kwargs): + if any_symbolic_tensors(args, kwargs): + return self.symbolic_call(*args, **kwargs) + else: + return self.call(*args, **kwargs) + + if traceback_utils.is_traceback_filtering_enabled(): + # Wrap self.call to provide helpful info in case of exception + call_fn = traceback_utils.inject_argument_info_in_traceback( + call_fn, + object_name=(f"{self.__class__.__name__}.call()"), + ) + return call_fn(*args, **kwargs) + + # Plain flow. + return call_fn(*args, **kwargs) + + def call(self, pred, true_fn, false_fn): + return backend.core.cond(pred, true_fn, false_fn) + + def compute_output_spec(self, pred, true_fn, false_fn): + true_fn_spec = backend.compute_output_spec(true_fn) + false_fn_spec = backend.compute_output_spec(false_fn) + if not self._check_output_spec(true_fn_spec, false_fn_spec): + raise ValueError( + "`true_fn` and `false_fn` should return outputs " + "of the same kind (struct, dtype and shape). " + f"Got {true_fn_spec} and {false_fn_spec} instead." + ) + return true_fn_spec + + def _check_output_spec(self, true_fn_spec, false_fn_spec): + try: + tree.assert_same_structure(true_fn_spec, false_fn_spec) + except: + return False + + def check_leaf(t_spec, f_spec): + if t_spec is None or f_spec is None: + return t_spec is None and f_spec is None + return t_spec.shape == f_spec.shape and t_spec.dtype == f_spec.dtype + + same = tree.map_structure(check_leaf, true_fn_spec, false_fn_spec) + return all(tree.flatten(same)) + + +@keras_export("keras.ops.cond") +def cond(pred, true_fn, false_fn): + """Conditionally applies `true_fn` or `false_fn`. + + Args: + pred: Boolean scalar type + true_fn: Callable returning the output for the `pred == True` case. + false_fn: Callable returning the output for the `pred == False` case. 
+ + Returns: + The output of either `true_fn` or `false_fn` depending on pred. + """ + return Cond()(pred, true_fn, false_fn) + + +# TODO: also create an Op subclass VectorizedMap. +@keras_export("keras.ops.vectorized_map") +def vectorized_map(function, elements): + """Parallel map of `function` on axis 0 of tensor(s) `elements`. + + Schematically, `vectorized_map` implements the following, + in the case of a single tensor input `elements`: + + ```python + def vectorized_map(function, elements) + outputs = [] + for e in elements: + outputs.append(function(e)) + return stack(outputs) + ``` + + In the case of an iterable of tensors `elements`, + it implements the following: + + ```python + def vectorized_map(function, elements) + batch_size = elements[0].shape[0] + outputs = [] + for index in range(batch_size): + outputs.append(function([e[index] for e in elements])) + return np.stack(outputs) + ``` + + In this case, `function` is expected to take as input + a single list of tensor arguments. + """ + return backend.core.vectorized_map(function, elements) + + +@keras_export("keras.ops.is_tensor") +def is_tensor(x): + """Check whether the given object is a tensor. + + Note: This checks for backend specific tensors so passing a TensorFlow + tensor would return `False` if your backend is PyTorch or JAX. + + Args: + x: A variable. + + Returns: + `True` if `x` is a tensor, otherwise `False`. + """ + return backend.core.is_tensor(x) + + +@keras_export("keras.ops.custom_gradient") +def custom_gradient(f): + """Decorator to define a function with a custom gradient. + + This decorator allows fine grained control over the gradients of a sequence + for operations. This may be useful for multiple reasons, including providing + a more efficient or numerically stable gradient for a sequence of + operations. + + Args: + f: Function `f(*args)` that returns a tuple + `(output, grad_fn)`, where: + - `args` is a sequence of (nested structures of) tensor inputs to + the function. 
+ - `output` is a (nested structure of) tensor outputs of applying + operations in `forward_fn` to `args`. + - `grad_fn` is a function with the signature `grad_fn(*args, + upstream)` which returns a tuple of tensors the same size as + (flattened) `args`: the derivatives of tensors in `output` with + respect to the tensors in `args`. `upstream` is a tensor or + sequence of tensors holding the initial value gradients for each + tensor in `output`. + + Returns: + A function `h(*args)` which returns the same value as + `f(*args)[0]` and whose gradient is determined by + `f(*args)[1]`. + + + Examples: + + 1. Backend-agnostic example. + + ```python + @ops.custom_gradient + def log1pexp(x): + e = ops.exp(x) + + def grad(*args, upstream=None): + if upstream is None: + (upstream,) = args + return ops.multiply(upstream, 1.0 - 1.0 / ops.add(1, e)) + + return ops.log(1 + e), grad + ``` + + Note that the grad function that returns gradient computation + requires `args` as well as an `upstream` keyword argument, depending + on the backend being set. With the JAX and TensorFlow backends, + it requires only one argument, whereas it might use the `upstream` + argument in the case of the PyTorch backend. + + When working with TensorFlow/JAX backend, `grad(upstream)` + is sufficient. With PyTorch, the `grad` function requires + `*args` as well as `upstream`, e.g. `def grad(*args, upstream)`. + Follow the previous example to use `@ops.custom_gradient` in + a way that is compatible with all backends. + + 2. Here's JAX & TensorFlow-specific example: + + ```python + @ops.custom_gradient + def log1pexp(x): + e = ops.exp(x) + def grad(upstream): + return ops.multiply(upstream, 1.0 - 1.0 / ops.add(1, e)) + return ops.log(1 + e), grad + ``` + + 3. 
Lastly, here's a PyTorch-specific example, + using `*args` & `upstream`: + + ```python + @ops.custom_gradient + def log1pexp(x): + e = ops.exp(x) + def grad(*args, upstream): + return ops.multiply(upstream, 1.0 - 1.0 / ops.add(1, e)) + return ops.log(1 + e), grad + ``` + """ + return backend.core.custom_gradient(f) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/function.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/function.py new file mode 100644 index 0000000000000000000000000000000000000000..d8a5c8d4f25150fa4cbe209ce10d40e41ef27808 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/function.py @@ -0,0 +1,423 @@ +import collections + +from keras.src import tree +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend.config import backend +from keras.src.ops.operation import Operation + + +@keras_export("keras.Function") +class Function(Operation): + """Class that encapsulates a computation graph of Keras operations. + + You can use a `Function` to capture the computation graph linking + some input tensors to some output tensors, and reapply the same + computation on new inputs. + + A `Function` is similar to a Functional Model, with the difference + that it is stateless (it does not track state variables) + and does not implement the `Layer` API. + + Example: + + ```python + input_1 = keras.KerasTensor(shape=(None, 2, 3)) + input_2 = keras.KerasTensor(shape=(None, 2, 3)) + x = input_1 + input_2 + output = keras.ops.sigmoid(x) + fn = keras.Function(inputs=[input_1, input_2], outputs=output) + + input_1_val = np.random.random((4, 2, 3)) + input_2_val = np.random.random((4, 2, 3)) + output_val = fn([input_1_val, input_2_val]) + ``` + + Args: + inputs: `KerasTensor` instance or nested structured of + `KerasTensor` instances. 
+ outputs: `KerasTensor` instance or nested structured of + `KerasTensor` instances. They should be computable + given only the values of `inputs`. + name: String. The name of the function. + """ + + def __init__(self, inputs, outputs, name=None): + super().__init__(name=name) + + if backend() == "tensorflow": + # Temporary work around for + # https://github.com/keras-team/keras/issues/931 + # This stop tensorflow from wrapping tf.function output in a + # _DictWrapper object. + _self_setattr_tracking = getattr( + self, "_self_setattr_tracking", True + ) + self._self_setattr_tracking = False + self._inputs_struct = tree.map_structure(lambda x: x, inputs) + self._outputs_struct = tree.map_structure(lambda x: x, outputs) + self._inputs = tree.flatten(inputs) + self._outputs = tree.flatten(outputs) + if not self._inputs: + raise ValueError( + "`inputs` argument cannot be empty. Received:\n" + f"inputs={inputs}\n" + f"outputs={outputs}" + ) + if not self._outputs: + raise ValueError( + "`outputs` argument cannot be empty. Received:\n" + f"inputs={inputs}\n" + f"outputs={outputs}" + ) + + if backend() == "tensorflow": + self._self_setattr_tracking = _self_setattr_tracking + + (nodes, nodes_by_depth, operations, operations_by_depth) = map_graph( + self._inputs, self._outputs + ) + self._nodes = nodes + self._nodes_by_depth = nodes_by_depth + self._operations = operations + self._operations_by_depth = operations_by_depth + + @property + def operations(self): + return self._operations[:] + + @property + def inputs(self): + """Flat list of the symbolic inputs of the Function.""" + return self._inputs + + @property + def outputs(self): + """Flat list of the symbolic outputs of the Function.""" + return self._outputs + + def compute_output_spec(self, inputs): + self._assert_input_compatibility(inputs) + # Check if input shapes are identical to ref input shapes, + # if so take a shortcut. 
+ shortcut = True + for x, x_ref in zip(tree.flatten(inputs), self._inputs): + if x.shape != x_ref.shape: + shortcut = False + break + if shortcut: + return tree.map_structure( + lambda x: KerasTensor(shape=x.shape, dtype=x.dtype), + self._outputs_struct, + ) + # No luck; take the long road through the graph. + # Original Keras used a cache to avoid recomputing all this + # when known input shapes where seen again. Perhaps a good + # idea to bring that back. + return self._run_through_graph( + inputs, operation_fn=lambda op: op.compute_output_spec + ) + + def compute_output_shape(self, input_shape): + # Wrap `input_shape` into the structure of KerasTensor to utilize + # `compute_output_spec`. + input_shape_struct = tree.map_shape_structure( + lambda x: KerasTensor(shape=x), input_shape + ) + # Ensure that dtype and sparse settings are the same as self._inputs, + # because we only care about the shape in this function. + for x, x_ref in zip(tree.flatten(input_shape_struct), self._inputs): + x._dtype = x_ref.dtype + x._sparse = x_ref.sparse + output_spec = self.compute_output_spec(input_shape_struct) + return tree.map_structure(lambda x: x.shape, output_spec) + + def call(self, inputs): + """Computes output tensors for new inputs.""" + self._assert_input_compatibility(inputs) + return self._run_through_graph(inputs, operation_fn=lambda op: op) + + def _run_through_graph(self, inputs, operation_fn, call_fn=None): + """Execute the graph. + + At each node we compute outputs via + `operation_fn(node.operation)(*args, **kwargs)`. + """ + inputs = tree.flatten(inputs) + + # Dictionary mapping reference tensors to computed tensors. 
+ tensor_dict = {} + for x, y in zip(self.inputs, inputs): + tensor_dict[id(x)] = y + + nodes_by_depth = self._nodes_by_depth + depth_keys = list(nodes_by_depth.keys()) + depth_keys.sort(reverse=True) + + for depth in depth_keys: + nodes = nodes_by_depth[depth] + for node in nodes: + if not node.operation or node.is_input: + continue # Input tensors already exist. + + if any(id(x) not in tensor_dict for x in node.input_tensors): + continue # Node is not computable, try skipping. + + args, kwargs = node.arguments.fill_in(tensor_dict) + op = operation_fn(node.operation) + if call_fn is not None: + outputs = call_fn(op, *args, **kwargs) + else: + outputs = op(*args, **kwargs) + + # Update tensor_dict. + for x, y in zip(node.outputs, tree.flatten(outputs)): + tensor_dict[id(x)] = y + + output_tensors = [] + for x in self.outputs: + output_tensors.append(tensor_dict[id(x)]) + + return tree.pack_sequence_as(self._outputs_struct, output_tensors) + + def _assert_input_compatibility(self, inputs): + try: + tree.assert_same_structure(inputs, self._inputs_struct) + except ValueError: + raise ValueError( + "Function was called with an invalid input structure. " + f"Expected input structure: {self._inputs_struct}\n" + f"Received input structure: {inputs}" + ) + for x, x_ref in zip(tree.flatten(inputs), self._inputs): + if len(x.shape) != len(x_ref.shape): + raise ValueError( + f"{self.__class__.__name__} was passed " + f"incompatible inputs. For input '{x_ref.name}', " + f"expected shape {x_ref.shape}, but received " + f"instead a tensor with shape {x.shape}." + ) + for dim, ref_dim in zip(x.shape, x_ref.shape): + if ref_dim is not None and dim is not None: + if dim != ref_dim: + raise ValueError( + f"{self.__class__.__name__} was passed " + f"incompatible inputs. For input '{x_ref.name}', " + f"expected shape {x_ref.shape}, but received " + f"instead a tensor with shape {x.shape}." 
+ ) + + +def make_node_key(op, node_index): + return str(id(op)) + "_ib-" + str(node_index) + + +def map_graph(inputs, outputs): + """Validates a graph's topology and gather its operations and nodes. + + Args: + inputs: List of input tensors. + outputs: List of outputs tensors. + + Returns: + A tuple `(nodes, nodes_by_depth, operations, operations_by_depth)`. + - nodes: set of Node instances + - nodes_by_depth: dict mapping ints (depth) to lists of node instances. + - operations: list of Operation instances. + - operations_by_depth: dict mapping ints (depth) to lists of Operation + instances. + """ + # "depth" is number of operations between output Node and the Node. + # Nodes are ordered from inputs -> outputs. + nodes_in_decreasing_depth, operation_indices = _build_map(inputs, outputs) + network_nodes = { + make_node_key(node.operation, node.operation._inbound_nodes.index(node)) + for node in nodes_in_decreasing_depth + } + + nodes_depths = {} # dict {node: depth value} + operations_depths = {} # dict {operation: depth value} + + for node in reversed(nodes_in_decreasing_depth): + # If the depth is not set, the node has no outbound nodes (depth 0). + depth = nodes_depths.setdefault(node, 0) + + # Update the depth of the corresponding operation + previous_depth = operations_depths.get(node.operation, 0) + # If we've seen this operation before at a higher depth, + # we should use that depth instead of the node depth. + # This is necessary for shared operations that have inputs at different + # depth levels in the graph. + depth = max(depth, previous_depth) + operations_depths[node.operation] = depth + nodes_depths[node] = depth + + # Update the depth of inbound nodes. + # The "depth" of a node is the max of the depths + # of all nodes it is connected to + 1. + for node_dep in node.parent_nodes: + previous_depth = nodes_depths.get(node_dep, 0) + nodes_depths[node_dep] = max(depth + 1, previous_depth) + + # Handle inputs that are not connected to outputs. 
+ # We do not error out here because the inputs may be used to compute losses + # and metrics. + for input_t in inputs: + input_operation = input_t._keras_history[0] + if input_operation and input_operation not in operations_depths: + operations_depths[input_operation] = 0 + operation_indices[input_operation] = -1 + nodes_depths[input_operation._inbound_nodes[0]] = 0 + network_nodes.add(make_node_key(input_operation, 0)) + + # Build a dict {depth: list of nodes with this depth} + nodes_by_depth = collections.defaultdict(list) + for node, depth in nodes_depths.items(): + nodes_by_depth[depth].append(node) + + # Build a dict {depth: list of operations with this depth} + operations_by_depth = collections.defaultdict(list) + for operation, depth in operations_depths.items(): + operations_by_depth[depth].append(operation) + + # Get sorted list of operation depths. + depth_keys = list(operations_by_depth.keys()) + depth_keys.sort(reverse=True) + + # Set self.operations ordered by depth. + operations = [] + for depth in depth_keys: + operations_for_depth = operations_by_depth[depth] + # Network.operations needs to have a deterministic order: + # here we order them by traversal order. + operations_for_depth.sort(key=lambda x: operation_indices[x]) + operations.extend(operations_for_depth) + + # Get sorted list of node depths. + depth_keys = list(nodes_by_depth.keys()) + depth_keys.sort(reverse=True) + + # Check that all tensors required are computable. + # computable_tensors: all tensors in the graph + # that can be computed from the inputs provided. + computable_tensors = set() + for x in inputs: + computable_tensors.add(x) + + operations_with_complete_input = [] # To provide a better error msg. 
+ for depth in depth_keys: + for node in nodes_by_depth[depth]: + for x in tree.flatten(node.input_tensors): + if x not in computable_tensors: + operation = node.operation + raise ValueError( + "Graph disconnected: cannot find parent for " + f"tensor {x} at operation '{operation}'. " + "The following previous operations were accessed " + f"without issue: {operations_with_complete_input}" + ) + operations_with_complete_input.append(node.operation.name) + + for x in tree.flatten(node.outputs): + computable_tensors.add(x) + + # Ensure name unicity, which will be crucial for serialization + # (since serialized nodes refer to operations by their name). + all_names = [operation.name for operation in operations] + for name in all_names: + if all_names.count(name) != 1: + raise ValueError( + f'The name "{name}" is used {all_names.count(name)} ' + "times in the model. All operation names should be unique." + ) + return network_nodes, nodes_by_depth, operations, operations_by_depth + + +def _build_map(inputs, outputs): + """Topologically sort nodes in order from inputs to outputs. + + It uses a depth-first search to topologically sort nodes that appear in the + _keras_history connectivity metadata of `outputs`. + + Args: + outputs: the output tensors whose _keras_history metadata should be + walked. This may be an arbitrary nested structure. + + Returns: + A tuple like (ordered_nodes, operation_to_first_traversal_index) + ordered_nodes: list of nodes appearing in the keras history, + topologically sorted from original inputs to the `outputs`. + (If outputs have different sets of ancestors, the inputs to one + output may appear after a different output). + operation_to_first_traversal_index: + A dict mapping operation to the traversal index in the DFS where it + is seen. Note: if a operation is shared by several nodes, the dict + will onlystore the index corresponding to the *first* time the + operation seen. 
+ """ + finished_nodes = set() + nodes_in_progress = set() + nodes_in_decreasing_depth = [] # nodes from inputs -> outputs. + operation_indices = {} # operation -> in traversal order. + for output in tree.flatten(outputs): + _build_map_helper( + inputs, + output, + finished_nodes, + nodes_in_progress, + nodes_in_decreasing_depth, + operation_indices, + ) + return nodes_in_decreasing_depth, operation_indices + + +def _build_map_helper( + inputs, + tensor, + finished_nodes, + nodes_in_progress, + nodes_in_decreasing_depth, + operation_indices, +): + """Recursive helper for `_build_map`.""" + ( + operation, + node_index, + _, + ) = tensor._keras_history + if not operation: + return + + node = operation._inbound_nodes[node_index] + + # Don't repeat work for shared subgraphs + if node in finished_nodes: + return + + # Prevent cycles. + if node in nodes_in_progress: + raise ValueError( + f"Tensor {tensor} from operation '{operation.name}' is part of a " + "cycle." + ) + + # Store the traversal order for operation sorting. + if operation not in operation_indices: + operation_indices[operation] = len(operation_indices) + + # Propagate to all previous tensors connected to this node. 
+ nodes_in_progress.add(node) + if not node.is_input and tensor not in tree.flatten(inputs): + for tensor in node.input_tensors: + _build_map_helper( + inputs, + tensor, + finished_nodes, + nodes_in_progress, + nodes_in_decreasing_depth, + operation_indices, + ) + + finished_nodes.add(node) + nodes_in_progress.remove(node) + nodes_in_decreasing_depth.append(node) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/image.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/image.py new file mode 100644 index 0000000000000000000000000000000000000000..ee397cbb6669262961d012149ef5371b4a9b77d2 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/image.py @@ -0,0 +1,1235 @@ +from keras.src import backend +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend import any_symbolic_tensors +from keras.src.ops.operation import Operation +from keras.src.ops.operation_utils import compute_conv_output_shape + + +class RGBToGrayscale(Operation): + def __init__(self, data_format=None): + super().__init__() + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return backend.image.rgb_to_grayscale( + images, data_format=self.data_format + ) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + if len(images_shape) not in (3, 4): + raise ValueError( + "Invalid images rank: expected rank 3 (single image) " + "or rank 4 (batch of images). " + f"Received: images.shape={images_shape}" + ) + if self.data_format == "channels_last": + images_shape[-1] = 1 + else: + images_shape[-3] = 1 + return KerasTensor(shape=images_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.rgb_to_grayscale") +def rgb_to_grayscale(images, data_format=None): + """Convert RGB images to grayscale. 
+ + This function converts RGB images to grayscale images. It supports both + 3D and 4D tensors. + + Args: + images: Input image or batch of images. Must be 3D or 4D. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + Grayscale image or batch of grayscale images. + + Examples: + + >>> import numpy as np + >>> from keras import ops + >>> x = np.random.random((2, 4, 4, 3)) + >>> y = ops.image.rgb_to_grayscale(x) + >>> y.shape + (2, 4, 4, 1) + + >>> x = np.random.random((4, 4, 3)) # Single RGB image + >>> y = ops.image.rgb_to_grayscale(x) + >>> y.shape + (4, 4, 1) + + >>> x = np.random.random((2, 3, 4, 4)) + >>> y = ops.image.rgb_to_grayscale(x, data_format="channels_first") + >>> y.shape + (2, 1, 4, 4) + """ + if any_symbolic_tensors((images,)): + return RGBToGrayscale(data_format=data_format).symbolic_call(images) + return backend.image.rgb_to_grayscale(images, data_format=data_format) + + +class RGBToHSV(Operation): + def __init__(self, data_format=None): + super().__init__() + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return backend.image.rgb_to_hsv(images, data_format=self.data_format) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + dtype = images.dtype + if len(images_shape) not in (3, 4): + raise ValueError( + "Invalid images rank: expected rank 3 (single image) " + "or rank 4 (batch of images). " + f"Received: images.shape={images_shape}" + ) + if not backend.is_float_dtype(dtype): + raise ValueError( + "Invalid images dtype: expected float dtype. 
" + f"Received: images.dtype={dtype}" + ) + return KerasTensor(shape=images_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.rgb_to_hsv") +def rgb_to_hsv(images, data_format=None): + """Convert RGB images to HSV. + + `images` must be of float dtype, and the output is only well defined if the + values in `images` are in `[0, 1]`. + + All HSV values are in `[0, 1]`. A hue of `0` corresponds to pure red, `1/3` + is pure green, and `2/3` is pure blue. + + Args: + images: Input image or batch of images. Must be 3D or 4D. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + HSV image or batch of HSV images. + + Examples: + + >>> import numpy as np + >>> from keras import ops + >>> x = np.random.random((2, 4, 4, 3)) + >>> y = ops.image.rgb_to_hsv(x) + >>> y.shape + (2, 4, 4, 3) + + >>> x = np.random.random((4, 4, 3)) # Single RGB image + >>> y = ops.image.rgb_to_hsv(x) + >>> y.shape + (4, 4, 3) + + >>> x = np.random.random((2, 3, 4, 4)) + >>> y = ops.image.rgb_to_hsv(x, data_format="channels_first") + >>> y.shape + (2, 3, 4, 4) + """ + if any_symbolic_tensors((images,)): + return RGBToHSV(data_format=data_format).symbolic_call(images) + return backend.image.rgb_to_hsv(images, data_format=data_format) + + +class HSVToRGB(Operation): + def __init__(self, data_format=None): + super().__init__() + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return backend.image.hsv_to_rgb(images, data_format=self.data_format) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + dtype = images.dtype + if len(images_shape) not in (3, 4): + raise 
ValueError( + "Invalid images rank: expected rank 3 (single image) " + "or rank 4 (batch of images). " + f"Received: images.shape={images_shape}" + ) + if not backend.is_float_dtype(dtype): + raise ValueError( + "Invalid images dtype: expected float dtype. " + f"Received: images.dtype={dtype}" + ) + return KerasTensor(shape=images_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.hsv_to_rgb") +def hsv_to_rgb(images, data_format=None): + """Convert HSV images to RGB. + + `images` must be of float dtype, and the output is only well defined if the + values in `images` are in `[0, 1]`. + + Args: + images: Input image or batch of images. Must be 3D or 4D. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + RGB image or batch of RGB images. 
+ + Examples: + + >>> import numpy as np + >>> from keras import ops + >>> x = np.random.random((2, 4, 4, 3)) + >>> y = ops.image.hsv_to_rgb(x) + >>> y.shape + (2, 4, 4, 3) + + >>> x = np.random.random((4, 4, 3)) # Single HSV image + >>> y = ops.image.hsv_to_rgb(x) + >>> y.shape + (4, 4, 3) + + >>> x = np.random.random((2, 3, 4, 4)) + >>> y = ops.image.hsv_to_rgb(x, data_format="channels_first") + >>> y.shape + (2, 3, 4, 4) + """ + if any_symbolic_tensors((images,)): + return HSVToRGB(data_format=data_format).symbolic_call(images) + return backend.image.hsv_to_rgb(images, data_format=data_format) + + +class Resize(Operation): + def __init__( + self, + size, + interpolation="bilinear", + antialias=False, + crop_to_aspect_ratio=False, + pad_to_aspect_ratio=False, + fill_mode="constant", + fill_value=0.0, + data_format=None, + ): + super().__init__() + self.size = tuple(size) + self.interpolation = interpolation + self.antialias = antialias + self.crop_to_aspect_ratio = crop_to_aspect_ratio + self.pad_to_aspect_ratio = pad_to_aspect_ratio + self.fill_mode = fill_mode + self.fill_value = fill_value + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return _resize( + images, + self.size, + interpolation=self.interpolation, + antialias=self.antialias, + data_format=self.data_format, + crop_to_aspect_ratio=self.crop_to_aspect_ratio, + pad_to_aspect_ratio=self.pad_to_aspect_ratio, + fill_mode=self.fill_mode, + fill_value=self.fill_value, + ) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + if len(images_shape) not in (3, 4): + raise ValueError( + "Invalid images rank: expected rank 3 (single image) " + "or rank 4 (batch of images). 
Received input with shape: " + f"images.shape={images.shape}" + ) + if self.data_format == "channels_last": + height_axis, width_axis = -3, -2 + else: + height_axis, width_axis = -2, -1 + images_shape[height_axis] = self.size[0] + images_shape[width_axis] = self.size[1] + return KerasTensor(shape=images_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.resize") +def resize( + images, + size, + interpolation="bilinear", + antialias=False, + crop_to_aspect_ratio=False, + pad_to_aspect_ratio=False, + fill_mode="constant", + fill_value=0.0, + data_format=None, +): + """Resize images to size using the specified interpolation method. + + Args: + images: Input image or batch of images. Must be 3D or 4D. + size: Size of output image in `(height, width)` format. + interpolation: Interpolation method. Available methods are `"nearest"`, + `"bilinear"`, and `"bicubic"`. Defaults to `"bilinear"`. + antialias: Whether to use an antialiasing filter when downsampling an + image. Defaults to `False`. + crop_to_aspect_ratio: If `True`, resize the images without aspect + ratio distortion. When the original aspect ratio differs + from the target aspect ratio, the output image will be + cropped so as to return the + largest possible window in the image (of size `(height, width)`) + that matches the target aspect ratio. By default + (`crop_to_aspect_ratio=False`), aspect ratio may not be preserved. + pad_to_aspect_ratio: If `True`, pad the images without aspect + ratio distortion. When the original aspect ratio differs + from the target aspect ratio, the output image will be + evenly padded on the short side. + fill_mode: When using `pad_to_aspect_ratio=True`, padded areas + are filled according to the given mode. Only `"constant"` is + supported at this time + (fill with constant value, equal to `fill_value`). + fill_value: Float. Padding value to use when `pad_to_aspect_ratio=True`. + data_format: A string specifying the data format of the input tensor. 
+ It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + Resized image or batch of images. + + Examples: + + >>> x = np.random.random((2, 4, 4, 3)) # batch of 2 RGB images + >>> y = keras.ops.image.resize(x, (2, 2)) + >>> y.shape + (2, 2, 2, 3) + + >>> x = np.random.random((4, 4, 3)) # single RGB image + >>> y = keras.ops.image.resize(x, (2, 2)) + >>> y.shape + (2, 2, 3) + + >>> x = np.random.random((2, 3, 4, 4)) # batch of 2 RGB images + >>> y = keras.ops.image.resize(x, (2, 2), + ... data_format="channels_first") + >>> y.shape + (2, 3, 2, 2) + """ + if len(size) != 2: + raise ValueError( + "Expected `size` to be a tuple of 2 integers. " + f"Received: size={size}" + ) + if len(images.shape) < 3 or len(images.shape) > 4: + raise ValueError( + "Invalid images rank: expected rank 3 (single image) " + "or rank 4 (batch of images). Received input with shape: " + f"images.shape={images.shape}" + ) + if pad_to_aspect_ratio and crop_to_aspect_ratio: + raise ValueError( + "Only one of `pad_to_aspect_ratio` & `crop_to_aspect_ratio` " + "can be `True`." 
+ ) + if any_symbolic_tensors((images,)): + return Resize( + size, + interpolation=interpolation, + antialias=antialias, + data_format=data_format, + crop_to_aspect_ratio=crop_to_aspect_ratio, + pad_to_aspect_ratio=pad_to_aspect_ratio, + fill_mode=fill_mode, + fill_value=fill_value, + ).symbolic_call(images) + return _resize( + images, + size, + interpolation=interpolation, + antialias=antialias, + crop_to_aspect_ratio=crop_to_aspect_ratio, + data_format=data_format, + pad_to_aspect_ratio=pad_to_aspect_ratio, + fill_mode=fill_mode, + fill_value=fill_value, + ) + + +def _resize( + images, + size, + interpolation="bilinear", + antialias=False, + crop_to_aspect_ratio=False, + pad_to_aspect_ratio=False, + fill_mode="constant", + fill_value=0.0, + data_format=None, +): + resized = backend.image.resize( + images, + size, + interpolation=interpolation, + antialias=antialias, + crop_to_aspect_ratio=crop_to_aspect_ratio, + data_format=data_format, + pad_to_aspect_ratio=pad_to_aspect_ratio, + fill_mode=fill_mode, + fill_value=fill_value, + ) + if resized.dtype == images.dtype: + # Only `torch` backend will cast result to original dtype with + # correct rounding and without dtype overflow + return resized + if backend.is_int_dtype(images.dtype): + resized = ops.round(resized) + return ops.saturate_cast(resized, images.dtype) + + +class AffineTransform(Operation): + def __init__( + self, + interpolation="bilinear", + fill_mode="constant", + fill_value=0, + data_format=None, + ): + super().__init__() + self.interpolation = interpolation + self.fill_mode = fill_mode + self.fill_value = fill_value + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images, transform): + return backend.image.affine_transform( + images, + transform, + interpolation=self.interpolation, + fill_mode=self.fill_mode, + fill_value=self.fill_value, + data_format=self.data_format, + ) + + def compute_output_spec(self, images, transform): + if len(images.shape) not in (3, 
4): + raise ValueError( + "Invalid images rank: expected rank 3 (single image) " + "or rank 4 (batch of images). Received input with shape: " + f"images.shape={images.shape}" + ) + if len(transform.shape) not in (1, 2): + raise ValueError( + "Invalid transform rank: expected rank 1 (single transform) " + "or rank 2 (batch of transforms). Received input with shape: " + f"transform.shape={transform.shape}" + ) + return KerasTensor(images.shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.affine_transform") +def affine_transform( + images, + transform, + interpolation="bilinear", + fill_mode="constant", + fill_value=0, + data_format=None, +): + """Applies the given transform(s) to the image(s). + + Args: + images: Input image or batch of images. Must be 3D or 4D. + transform: Projective transform matrix/matrices. A vector of length 8 or + tensor of size N x 8. If one row of transform is + `[a0, a1, a2, b0, b1, b2, c0, c1]`, then it maps the output point + `(x, y)` to a transformed input point + `(x', y') = ((a0 x + a1 y + a2) / k, (b0 x + b1 y + b2) / k)`, + where `k = c0 x + c1 y + 1`. The transform is inverted compared to + the transform mapping input points to output points. Note that + gradients are not backpropagated into transformation parameters. + Note that `c0` and `c1` are only effective when using TensorFlow + backend and will be considered as `0` when using other backends. + interpolation: Interpolation method. Available methods are `"nearest"`, + and `"bilinear"`. Defaults to `"bilinear"`. + fill_mode: Points outside the boundaries of the input are filled + according to the given mode. Available methods are `"constant"`, + `"nearest"`, `"wrap"` and `"reflect"`. Defaults to `"constant"`. + - `"reflect"`: `(d c b a | a b c d | d c b a)` + The input is extended by reflecting about the edge of the last + pixel. 
+ - `"constant"`: `(k k k k | a b c d | k k k k)` + The input is extended by filling all values beyond + the edge with the same constant value k specified by + `fill_value`. + - `"wrap"`: `(a b c d | a b c d | a b c d)` + The input is extended by wrapping around to the opposite edge. + - `"nearest"`: `(a a a a | a b c d | d d d d)` + The input is extended by the nearest pixel. + fill_value: Value used for points outside the boundaries of the input if + `fill_mode="constant"`. Defaults to `0`. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + Applied affine transform image or batch of images. + + Examples: + + >>> x = np.random.random((2, 64, 80, 3)) # batch of 2 RGB images + >>> transform = np.array( + ... [ + ... [1.5, 0, -20, 0, 1.5, -16, 0, 0], # zoom + ... [1, 0, -20, 0, 1, -16, 0, 0], # translation + ... ] + ... ) + >>> y = keras.ops.image.affine_transform(x, transform) + >>> y.shape + (2, 64, 80, 3) + + >>> x = np.random.random((64, 80, 3)) # single RGB image + >>> transform = np.array([1.0, 0.5, -20, 0.5, 1.0, -16, 0, 0]) # shear + >>> y = keras.ops.image.affine_transform(x, transform) + >>> y.shape + (64, 80, 3) + + >>> x = np.random.random((2, 3, 64, 80)) # batch of 2 RGB images + >>> transform = np.array( + ... [ + ... [1.5, 0, -20, 0, 1.5, -16, 0, 0], # zoom + ... [1, 0, -20, 0, 1, -16, 0, 0], # translation + ... ] + ... ) + >>> y = keras.ops.image.affine_transform(x, transform, + ... 
data_format="channels_first") + >>> y.shape + (2, 3, 64, 80) + """ + if any_symbolic_tensors((images, transform)): + return AffineTransform( + interpolation=interpolation, + fill_mode=fill_mode, + fill_value=fill_value, + data_format=data_format, + ).symbolic_call(images, transform) + return backend.image.affine_transform( + images, + transform, + interpolation=interpolation, + fill_mode=fill_mode, + fill_value=fill_value, + data_format=data_format, + ) + + +class ExtractPatches(Operation): + def __init__( + self, + size, + strides=None, + dilation_rate=1, + padding="valid", + data_format=None, + ): + super().__init__() + if isinstance(size, int): + size = (size, size) + self.size = size + self.strides = strides + self.dilation_rate = dilation_rate + self.padding = padding + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return _extract_patches( + images=images, + size=self.size, + strides=self.strides, + dilation_rate=self.dilation_rate, + padding=self.padding, + data_format=self.data_format, + ) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + original_ndim = len(images_shape) + if not self.strides: + strides = (self.size[0], self.size[1]) + if self.data_format == "channels_last": + channels_in = images_shape[-1] + else: + channels_in = images_shape[-3] + if original_ndim == 3: + images_shape = [1] + images_shape + filters = self.size[0] * self.size[1] * channels_in + kernel_size = (self.size[0], self.size[1]) + out_shape = compute_conv_output_shape( + images_shape, + filters, + kernel_size, + strides=strides, + padding=self.padding, + data_format=self.data_format, + dilation_rate=self.dilation_rate, + ) + if original_ndim == 3: + out_shape = out_shape[1:] + return KerasTensor(shape=out_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.extract_patches") +def extract_patches( + images, + size, + strides=None, + dilation_rate=1, + padding="valid", + data_format=None, +): + 
"""Extracts patches from the image(s). + + Args: + images: Input image or batch of images. Must be 3D or 4D. + size: Patch size int or tuple (patch_height, patch_width) + strides: strides along height and width. If not specified, or + if `None`, it defaults to the same value as `size`. + dilation_rate: This is the input stride, specifying how far two + consecutive patch samples are in the input. For value other than 1, + strides must be 1. NOTE: `strides > 1` is not supported in + conjunction with `dilation_rate > 1` + padding: The type of padding algorithm to use: `"same"` or `"valid"`. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + Extracted patches 3D (if not batched) or 4D (if batched) + + Examples: + + >>> image = np.random.random( + ... (2, 20, 20, 3) + ... 
).astype("float32") # batch of 2 RGB images + >>> patches = keras.ops.image.extract_patches(image, (5, 5)) + >>> patches.shape + (2, 4, 4, 75) + >>> image = np.random.random((20, 20, 3)).astype("float32") # 1 RGB image + >>> patches = keras.ops.image.extract_patches(image, (3, 3), (1, 1)) + >>> patches.shape + (18, 18, 27) + """ + if any_symbolic_tensors((images,)): + return ExtractPatches( + size=size, + strides=strides, + dilation_rate=dilation_rate, + padding=padding, + data_format=data_format, + ).symbolic_call(images) + + return _extract_patches( + images, size, strides, dilation_rate, padding, data_format=data_format + ) + + +def _extract_patches( + images, + size, + strides=None, + dilation_rate=1, + padding="valid", + data_format=None, +): + if isinstance(size, int): + patch_h = patch_w = size + elif len(size) == 2: + patch_h, patch_w = size[0], size[1] + else: + raise TypeError( + "Invalid `size` argument. Expected an " + f"int or a tuple of length 2. Received: size={size}" + ) + data_format = backend.standardize_data_format(data_format) + if data_format == "channels_last": + channels_in = images.shape[-1] + elif data_format == "channels_first": + channels_in = images.shape[-3] + if not strides: + strides = size + out_dim = patch_h * patch_w * channels_in + kernel = backend.numpy.eye(out_dim, dtype=images.dtype) + kernel = backend.numpy.reshape( + kernel, (patch_h, patch_w, channels_in, out_dim) + ) + _unbatched = False + if len(images.shape) == 3: + _unbatched = True + images = backend.numpy.expand_dims(images, axis=0) + patches = backend.nn.conv( + inputs=images, + kernel=kernel, + strides=strides, + padding=padding, + data_format=data_format, + dilation_rate=dilation_rate, + ) + if _unbatched: + patches = backend.numpy.squeeze(patches, axis=0) + return patches + + +class MapCoordinates(Operation): + def __init__(self, order, fill_mode="constant", fill_value=0): + super().__init__() + self.order = order + self.fill_mode = fill_mode + self.fill_value = 
fill_value + + def call(self, inputs, coordinates): + return backend.image.map_coordinates( + inputs, + coordinates, + order=self.order, + fill_mode=self.fill_mode, + fill_value=self.fill_value, + ) + + def compute_output_spec(self, inputs, coordinates): + if coordinates.shape[0] != len(inputs.shape): + raise ValueError( + "First dim of `coordinates` must be the same as the rank of " + "`inputs`. " + f"Received inputs with shape: {inputs.shape} and coordinate " + f"leading dim of {coordinates.shape[0]}" + ) + if len(coordinates.shape) < 2: + raise ValueError( + "Invalid coordinates rank: expected at least rank 2." + f" Received input with shape: {coordinates.shape}" + ) + return KerasTensor(coordinates.shape[1:], dtype=inputs.dtype) + + +@keras_export("keras.ops.image.map_coordinates") +def map_coordinates( + inputs, coordinates, order, fill_mode="constant", fill_value=0 +): + """Map the input array to new coordinates by interpolation. + + Note that interpolation near boundaries differs from the scipy function, + because we fixed an outstanding bug + [scipy/issues/2640](https://github.com/scipy/scipy/issues/2640). + + Args: + inputs: The input array. + coordinates: The coordinates at which inputs is evaluated. + order: The order of the spline interpolation. The order must be `0` or + `1`. `0` indicates the nearest neighbor and `1` indicates the linear + interpolation. + fill_mode: Points outside the boundaries of the inputs are filled + according to the given mode. Available methods are `"constant"`, + `"nearest"`, `"wrap"` and `"mirror"` and `"reflect"`. Defaults to + `"constant"`. + - `"constant"`: `(k k k k | a b c d | k k k k)` + The inputs is extended by filling all values beyond + the edge with the same constant value k specified by + `fill_value`. + - `"nearest"`: `(a a a a | a b c d | d d d d)` + The inputs is extended by the nearest pixel. + - `"wrap"`: `(a b c d | a b c d | a b c d)` + The inputs is extended by wrapping around to the opposite edge. 
+ - `"mirror"`: `(c d c b | a b c d | c b a b)` + The inputs is extended by mirroring about the edge. + - `"reflect"`: `(d c b a | a b c d | d c b a)` + The inputs is extended by reflecting about the edge of the last + pixel. + fill_value: Value used for points outside the boundaries of the inputs + if `fill_mode="constant"`. Defaults to `0`. + + Returns: + Output input or batch of inputs. + + """ + if any_symbolic_tensors((inputs, coordinates)): + return MapCoordinates( + order, + fill_mode, + fill_value, + ).symbolic_call(inputs, coordinates) + return backend.image.map_coordinates( + inputs, + coordinates, + order, + fill_mode, + fill_value, + ) + + +class PadImages(Operation): + def __init__( + self, + top_padding=None, + left_padding=None, + bottom_padding=None, + right_padding=None, + target_height=None, + target_width=None, + data_format=None, + ): + super().__init__() + self.top_padding = top_padding + self.left_padding = left_padding + self.bottom_padding = bottom_padding + self.right_padding = right_padding + self.target_height = target_height + self.target_width = target_width + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return _pad_images( + images, + self.top_padding, + self.left_padding, + self.bottom_padding, + self.right_padding, + self.target_height, + self.target_width, + self.data_format, + ) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + + if self.data_format == "channels_last": + height_axis, width_axis = -3, -2 + height, width = images_shape[height_axis], images_shape[width_axis] + else: + height_axis, width_axis = -2, -1 + height, width = images_shape[height_axis], images_shape[width_axis] + + target_height = self.target_height + if target_height is None and height is not None: + target_height = self.top_padding + height + self.bottom_padding + target_width = self.target_width + if target_width is None and width is not None: + target_width = self.left_padding 
+ width + self.right_padding + + images_shape[height_axis] = target_height + images_shape[width_axis] = target_width + return KerasTensor(shape=images_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.pad_images") +def pad_images( + images, + top_padding=None, + left_padding=None, + bottom_padding=None, + right_padding=None, + target_height=None, + target_width=None, + data_format=None, +): + """Pad `images` with zeros to the specified `height` and `width`. + + Args: + images: Input image or batch of images. Must be 3D or 4D. + top_padding: Number of rows of zeros to add on top. + left_padding: Number of columns of zeros to add on the left. + bottom_padding: Number of rows of zeros to add at the bottom. + right_padding: Number of columns of zeros to add on the right. + target_height: Height of output images. + target_width: Width of output images. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + Padded image or batch of images. + + Example: + + >>> images = np.random.random((15, 25, 3)) + >>> padded_images = keras.ops.image.pad_images( + ... images, 2, 3, target_height=20, target_width=30 + ... ) + >>> padded_images.shape + (20, 30, 3) + + >>> batch_images = np.random.random((2, 15, 25, 3)) + >>> padded_batch = keras.ops.image.pad_images( + ... batch_images, 2, 3, target_height=20, target_width=30 + ... 
) + >>> padded_batch.shape + (2, 20, 30, 3)""" + + if any_symbolic_tensors((images,)): + return PadImages( + top_padding, + left_padding, + bottom_padding, + right_padding, + target_height, + target_width, + data_format, + ).symbolic_call(images) + + return _pad_images( + images, + top_padding, + left_padding, + bottom_padding, + right_padding, + target_height, + target_width, + data_format, + ) + + +def _pad_images( + images, + top_padding, + left_padding, + bottom_padding, + right_padding, + target_height, + target_width, + data_format=None, +): + data_format = backend.standardize_data_format(data_format) + images = backend.convert_to_tensor(images) + images_shape = ops.shape(images) + + # Check + if len(images_shape) not in (3, 4): + raise ValueError( + f"Invalid shape for argument `images`: " + "it must have rank 3 or 4. " + f"Received: images.shape={images_shape}" + ) + if [top_padding, bottom_padding, target_height].count(None) != 1: + raise ValueError( + "Must specify exactly two of " + "top_padding, bottom_padding, target_height. " + f"Received: top_padding={top_padding}, " + f"bottom_padding={bottom_padding}, " + f"target_height={target_height}" + ) + if [left_padding, right_padding, target_width].count(None) != 1: + raise ValueError( + "Must specify exactly two of " + "left_padding, right_padding, target_width. 
" + f"Received: left_padding={left_padding}, " + f"right_padding={right_padding}, " + f"target_width={target_width}" + ) + + is_batch = False if len(images_shape) == 3 else True + if data_format == "channels_last": + height, width = images_shape[-3], images_shape[-2] + else: + height, width = images_shape[-2], images_shape[-1] + + # Infer padding + if top_padding is None: + top_padding = target_height - bottom_padding - height + if bottom_padding is None: + bottom_padding = target_height - top_padding - height + if left_padding is None: + left_padding = target_width - right_padding - width + if right_padding is None: + right_padding = target_width - left_padding - width + + if top_padding < 0: + raise ValueError( + f"top_padding must be >= 0. Received: top_padding={top_padding}" + ) + if left_padding < 0: + raise ValueError( + "left_padding must be >= 0. " + f"Received: left_padding={left_padding}" + ) + if right_padding < 0: + raise ValueError( + "right_padding must be >= 0. " + f"Received: right_padding={right_padding}" + ) + if bottom_padding < 0: + raise ValueError( + "bottom_padding must be >= 0. 
" + f"Received: bottom_padding={bottom_padding}" + ) + + # Compute pad_width + pad_width = [[top_padding, bottom_padding], [left_padding, right_padding]] + if data_format == "channels_last": + pad_width = pad_width + [[0, 0]] + else: + pad_width = [[0, 0]] + pad_width + if is_batch: + pad_width = [[0, 0]] + pad_width + + padded_images = backend.numpy.pad(images, pad_width) + return padded_images + + +class CropImages(Operation): + def __init__( + self, + top_cropping, + left_cropping, + bottom_cropping, + right_cropping, + target_height, + target_width, + data_format=None, + ): + super().__init__() + self.top_cropping = top_cropping + self.bottom_cropping = bottom_cropping + self.left_cropping = left_cropping + self.right_cropping = right_cropping + self.target_height = target_height + self.target_width = target_width + self.data_format = backend.standardize_data_format(data_format) + + def call(self, images): + return _crop_images( + images, + self.top_cropping, + self.left_cropping, + self.bottom_cropping, + self.right_cropping, + self.target_height, + self.target_width, + self.data_format, + ) + + def compute_output_spec(self, images): + images_shape = list(images.shape) + + if self.data_format == "channels_last": + height_axis, width_axis = -3, -2 + else: + height_axis, width_axis = -2, -1 + height, width = images_shape[height_axis], images_shape[width_axis] + + if height is None and self.target_height is None: + raise ValueError( + "When the height of the images is unknown, `target_height` " + "must be specified." + f"Received images.shape={images_shape} and " + f"target_height={self.target_height}" + ) + if width is None and self.target_width is None: + raise ValueError( + "When the width of the images is unknown, `target_width` " + "must be specified." 
+ f"Received images.shape={images_shape} and " + f"target_width={self.target_width}" + ) + + target_height = self.target_height + if target_height is None: + target_height = height - self.top_cropping - self.bottom_cropping + target_width = self.target_width + if target_width is None: + target_width = width - self.left_cropping - self.right_cropping + + images_shape[height_axis] = target_height + images_shape[width_axis] = target_width + return KerasTensor(shape=images_shape, dtype=images.dtype) + + +@keras_export("keras.ops.image.crop_images") +def crop_images( + images, + top_cropping=None, + left_cropping=None, + bottom_cropping=None, + right_cropping=None, + target_height=None, + target_width=None, + data_format=None, +): + """Crop `images` to a specified `height` and `width`. + + Args: + images: Input image or batch of images. Must be 3D or 4D. + top_cropping: Number of columns to crop from the top. + left_cropping: Number of columns to crop from the left. + bottom_cropping: Number of columns to crop from the bottom. + right_cropping: Number of columns to crop from the right. + target_height: Height of the output images. + target_width: Width of the output images. + data_format: A string specifying the data format of the input tensor. + It can be either `"channels_last"` or `"channels_first"`. + `"channels_last"` corresponds to inputs with shape + `(batch, height, width, channels)`, while `"channels_first"` + corresponds to inputs with shape `(batch, channels, height, width)`. + If not specified, the value will default to + `keras.config.image_data_format`. + + Returns: + Cropped image or batch of images. 
+ + Example: + + >>> images = np.reshape(np.arange(1, 28, dtype="float32"), [3, 3, 3]) + >>> images[:,:,0] # print the first channel of the images + array([[ 1., 4., 7.], + [10., 13., 16.], + [19., 22., 25.]], dtype=float32) + >>> cropped_images = keras.image.crop_images(images, 0, 0, 2, 2) + >>> cropped_images[:,:,0] # print the first channel of the cropped images + array([[ 1., 4.], + [10., 13.]], dtype=float32)""" + + if any_symbolic_tensors((images,)): + return CropImages( + top_cropping, + left_cropping, + bottom_cropping, + right_cropping, + target_height, + target_width, + data_format, + ).symbolic_call(images) + + return _crop_images( + images, + top_cropping, + left_cropping, + bottom_cropping, + right_cropping, + target_height, + target_width, + data_format, + ) + + +def _crop_images( + images, + top_cropping, + left_cropping, + bottom_cropping, + right_cropping, + target_height, + target_width, + data_format=None, +): + data_format = backend.standardize_data_format(data_format) + images = backend.convert_to_tensor(images) + images_shape = ops.shape(images) + + # Check + if len(images_shape) not in (3, 4): + raise ValueError( + f"Invalid shape for argument `images`: " + "it must have rank 3 or 4. " + f"Received: images.shape={images_shape}" + ) + if [top_cropping, bottom_cropping, target_height].count(None) != 1: + raise ValueError( + "Must specify exactly two of " + "top_cropping, bottom_cropping, target_height. " + f"Received: top_cropping={top_cropping}, " + f"bottom_cropping={bottom_cropping}, " + f"target_height={target_height}" + ) + if [left_cropping, right_cropping, target_width].count(None) != 1: + raise ValueError( + "Must specify exactly two of " + "left_cropping, right_cropping, target_width. 
" + f"Received: left_cropping={left_cropping}, " + f"right_cropping={right_cropping}, " + f"target_width={target_width}" + ) + + is_batch = False if len(images_shape) == 3 else True + if data_format == "channels_last": + height, width = images_shape[-3], images_shape[-2] + channels = images_shape[-1] + else: + height, width = images_shape[-2], images_shape[-1] + channels = images_shape[-3] + + # Infer padding + if top_cropping is None: + top_cropping = height - target_height - bottom_cropping + if target_height is None: + target_height = height - bottom_cropping - top_cropping + if left_cropping is None: + left_cropping = width - target_width - right_cropping + if target_width is None: + target_width = width - right_cropping - left_cropping + + if top_cropping < 0: + raise ValueError( + "top_cropping must be >= 0. " + f"Received: top_cropping={top_cropping}" + ) + if target_height < 0: + raise ValueError( + "target_height must be >= 0. " + f"Received: target_height={target_height}" + ) + if left_cropping < 0: + raise ValueError( + "left_cropping must be >= 0. " + f"Received: left_cropping={left_cropping}" + ) + if target_width < 0: + raise ValueError( + "target_width must be >= 0. 
" + f"Received: target_width={target_width}" + ) + + # Compute start_indices and shape + start_indices = [top_cropping, left_cropping] + shape = [target_height, target_width] + if data_format == "channels_last": + start_indices = start_indices + [0] + shape = shape + [channels] + else: + start_indices = [0] + start_indices + shape = [channels] + shape + if is_batch: + batch_size = images_shape[0] + start_indices = [0] + start_indices + shape = [batch_size] + shape + + cropped_images = ops.slice(images, start_indices, shape) + return cropped_images diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/linalg.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/linalg.py new file mode 100644 index 0000000000000000000000000000000000000000..0ecd170c77376bb972aed45ed38cbe11efeace47 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/linalg.py @@ -0,0 +1,707 @@ +from keras.src import backend +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend import any_symbolic_tensors +from keras.src.ops.operation import Operation +from keras.src.ops.operation_utils import reduce_shape + + +class Cholesky(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return _cholesky(x) + + def compute_output_spec(self, x): + _assert_2d(x) + _assert_square(x) + return KerasTensor(x.shape, x.dtype) + + +@keras_export(["keras.ops.cholesky", "keras.ops.linalg.cholesky"]) +def cholesky(x): + """Computes the Cholesky decomposition of a positive semi-definite matrix. + + Args: + x: Input tensor of shape `(..., M, M)`. + + Returns: + A tensor of shape `(..., M, M)` representing the lower triangular + Cholesky factor of `x`. 
+ + """ + if any_symbolic_tensors((x,)): + return Cholesky().symbolic_call(x) + return _cholesky(x) + + +def _cholesky(x): + x = backend.convert_to_tensor(x) + _assert_2d(x) + _assert_square(x) + try: + return backend.linalg.cholesky(x) + except Exception as e: + raise ValueError(f"Cholesky decomposition failed: {e}") + + +class Det(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return _det(x) + + def compute_output_spec(self, x): + _assert_2d(x) + _assert_square(x) + return KerasTensor(x.shape[:-2], x.dtype) + + +@keras_export(["keras.ops.det", "keras.ops.linalg.det"]) +def det(x): + """Computes the determinant of a square tensor. + + Args: + x: Input tensor of shape `(..., M, M)`. + + Returns: + A tensor of shape `(...,)` representing the determinant of `x`. + + """ + if any_symbolic_tensors((x,)): + return Det().symbolic_call(x) + return _det(x) + + +def _det(x): + x = backend.convert_to_tensor(x) + _assert_2d(x) + _assert_square(x) + return backend.linalg.det(x) + + +class Eig(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return _eig(x) + + def compute_output_spec(self, x): + _assert_square(x) + _assert_2d(x) + return ( + KerasTensor(x.shape[:-1], x.dtype), + KerasTensor(x.shape, x.dtype), + ) + + +@keras_export(["keras.ops.eig", "keras.ops.linalg.eig"]) +def eig(x): + """Computes the eigenvalues and eigenvectors of a square matrix. + + Args: + x: Input tensor of shape `(..., M, M)`. + + Returns: + A tuple of two tensors: a tensor of shape `(..., M)` containing + eigenvalues and a tensor of shape `(..., M, M)` containing eigenvectors. 
+ """ + if any_symbolic_tensors((x,)): + return Eig().symbolic_call(x) + return _eig(x) + + +def _eig(x): + x = backend.convert_to_tensor(x) + _assert_square(x) + _assert_2d(x) + return backend.linalg.eig(x) + + +class Eigh(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return _eigh(x) + + def compute_output_spec(self, x): + _assert_square(x) + _assert_2d(x) + return ( + KerasTensor(x.shape[:-1], x.dtype), + KerasTensor(x.shape, x.dtype), + ) + + +@keras_export(["keras.ops.eigh", "keras.ops.linalg.eigh"]) +def eigh(x): + """Computes the eigenvalues and eigenvectors of a complex Hermitian. + + Args: + x: Input tensor of shape `(..., M, M)`. + + Returns: + A tuple of two tensors: a tensor of shape `(..., M)` containing + eigenvalues and a tensor of shape `(..., M, M)` containing eigenvectors. + + """ + if any_symbolic_tensors((x,)): + return Eigh().symbolic_call(x) + return _eigh(x) + + +def _eigh(x): + x = backend.convert_to_tensor(x) + _assert_square(x) + _assert_2d(x) + return backend.linalg.eigh(x) + + +class Inv(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return _inv(x) + + def compute_output_spec(self, x): + _assert_2d(x) + _assert_square(x) + return KerasTensor(x.shape, x.dtype) + + +@keras_export(["keras.ops.inv", "keras.ops.linalg.inv"]) +def inv(x): + """Computes the inverse of a square tensor. + + Args: + x: Input tensor of shape `(..., M, M)`. + + Returns: + A tensor of shape `(..., M, M)` representing the inverse of `x`. 
+ + """ + if any_symbolic_tensors((x,)): + return Inv().symbolic_call(x) + return _inv(x) + + +def _inv(x): + x = backend.convert_to_tensor(x) + _assert_2d(x) + _assert_square(x) + return backend.linalg.inv(x) + + +class LuFactor(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return _lu_factor(x) + + def compute_output_spec(self, x): + _assert_2d(x) + batch_shape = x.shape[:-2] + m, n = x.shape[-2:] + k = min(m, n) + return ( + KerasTensor(batch_shape + (m, n), x.dtype), + KerasTensor(batch_shape + (k,), x.dtype), + ) + + +@keras_export(["keras.ops.lu_factor", "keras.ops.linalg.lu_factor"]) +def lu_factor(x): + """Computes the lower-upper decomposition of a square matrix. + + Args: + x: A tensor of shape `(..., M, M)`. + + Returns: + A tuple of two tensors: a tensor of shape `(..., M, M)` containing the + lower and upper triangular matrices and a tensor of shape `(..., M)` + containing the pivots. + + """ + if any_symbolic_tensors((x,)): + return LuFactor().symbolic_call(x) + return _lu_factor(x) + + +def _lu_factor(x): + x = backend.convert_to_tensor(x) + _assert_2d(x) + if backend.backend() == "tensorflow": + try: + _assert_square(x) + except ValueError as e: + raise ValueError( + f"LU decomposition failed: {e}. LU decomposition is only " + "supported for square matrices in Tensorflow." + ) + return backend.linalg.lu_factor(x) + + +class Norm(Operation): + def __init__(self, ord=None, axis=None, keepdims=False): + super().__init__() + if isinstance(ord, str): + if ord not in ("fro", "nuc"): + raise ValueError( + "Invalid `ord` argument. " + "Expected one of {'fro', 'nuc'} when using string. 
" + f"Received: ord={ord}" + ) + if isinstance(axis, int): + axis = [axis] + self.ord = ord + self.axis = axis + self.keepdims = keepdims + + def compute_output_spec(self, x): + output_dtype = backend.standardize_dtype(x.dtype) + if "int" in output_dtype or output_dtype == "bool": + output_dtype = backend.floatx() + if self.axis is None: + axis = tuple(range(len(x.shape))) + else: + axis = self.axis + num_axes = len(axis) + if num_axes == 1 and isinstance(self.ord, str): + raise ValueError( + "Invalid `ord` argument for vector norm. " + f"Received: ord={self.ord}" + ) + elif num_axes == 2 and self.ord not in ( + None, + "fro", + "nuc", + float("inf"), + float("-inf"), + 1, + -1, + 2, + -2, + ): + raise ValueError( + "Invalid `ord` argument for matrix norm. " + f"Received: ord={self.ord}" + ) + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=output_dtype, + ) + + def call(self, x): + x = backend.convert_to_tensor(x) + return backend.linalg.norm( + x, ord=self.ord, axis=self.axis, keepdims=self.keepdims + ) + + +@keras_export(["keras.ops.norm", "keras.ops.linalg.norm"]) +def norm(x, ord=None, axis=None, keepdims=False): + """Matrix or vector norm. + + This function is able to return one of eight different matrix norms, or one + of an infinite number of vector norms (described below), depending on the + value of the `ord` parameter. + + Args: + x: Input tensor. + ord: Order of the norm (see table under Notes). The default is `None`. + axis: If `axis` is an integer, it specifies the axis of `x` along which + to compute the vector norms. If `axis` is a 2-tuple, it specifies + the axes that hold 2-D matrices, and the matrix norms of these + matrices are computed. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. 
+ + Note: + For values of `ord < 1`, the result is, strictly speaking, not a + mathematical 'norm', but it may still be useful for various numerical + purposes. The following norms can be calculated: + - For matrices: + - `ord=None`: Frobenius norm + - `ord="fro"`: Frobenius norm + - `ord="nuc"`: nuclear norm + - `ord=np.inf`: `max(sum(abs(x), axis=1))` + - `ord=-np.inf`: `min(sum(abs(x), axis=1))` + - `ord=0`: not supported + - `ord=1`: `max(sum(abs(x), axis=0))` + - `ord=-1`: `min(sum(abs(x), axis=0))` + - `ord=2`: 2-norm (largest sing. value) + - `ord=-2`: smallest singular value + - other: not supported + - For vectors: + - `ord=None`: 2-norm + - `ord="fro"`: not supported + - `ord="nuc"`: not supported + - `ord=np.inf`: `max(abs(x))` + - `ord=-np.inf`: `min(abs(x))` + - `ord=0`: `sum(x != 0)` + - `ord=1`: as below + - `ord=-1`: as below + - `ord=2`: as below + - `ord=-2`: as below + - other: `sum(abs(x)**ord)**(1./ord)` + + Returns: + Norm of the matrix or vector(s). + + Example: + + >>> x = keras.ops.reshape(keras.ops.arange(9, dtype="float32") - 4, (3, 3)) + >>> keras.ops.linalg.norm(x) + 7.7459664 + """ + if any_symbolic_tensors((x,)): + return Norm(ord=ord, axis=axis, keepdims=keepdims).symbolic_call(x) + x = backend.convert_to_tensor(x) + return backend.linalg.norm(x, ord=ord, axis=axis, keepdims=keepdims) + + +class Qr(Operation): + def __init__(self, mode="reduced"): + super().__init__() + if mode not in {"reduced", "complete"}: + raise ValueError( + "`mode` argument value not supported. " + "Expected one of {'reduced', 'complete'}. " + f"Received: mode={mode}" + ) + self.mode = mode + + def compute_output_spec(self, x): + if len(x.shape) < 2: + raise ValueError( + "Input should have rank >= 2. Received: " + f"input.shape = {x.shape}" + ) + m = x.shape[-2] + n = x.shape[-1] + if m is None or n is None: + raise ValueError( + "Input should have its last 2 dimensions " + "fully-defined. 
Received: " + f"input.shape = {x.shape}" + ) + k = min(m, n) + base = tuple(x.shape[:-2]) + if self.mode == "reduced": + return ( + KerasTensor(shape=base + (m, k), dtype=x.dtype), + KerasTensor(shape=base + (k, n), dtype=x.dtype), + ) + # 'complete' mode. + return ( + KerasTensor(shape=base + (m, m), dtype=x.dtype), + KerasTensor(shape=base + (m, n), dtype=x.dtype), + ) + + def call(self, x): + x = backend.convert_to_tensor(x) + return backend.linalg.qr(x, mode=self.mode) + + +@keras_export(["keras.ops.qr", "keras.ops.linalg.qr"]) +def qr(x, mode="reduced"): + """Computes the QR decomposition of a tensor. + + Args: + x: Input tensor of shape `(..., M, N)`. + mode: A string specifying the mode of the QR decomposition. + - 'reduced': Returns the reduced QR decomposition. (default) + - 'complete': Returns the complete QR decomposition. + + Returns: + A tuple containing two tensors. The first tensor of shape `(..., M, K)` + is the orthogonal matrix `q` and the second tensor of shape + `(..., K, N)` is the upper triangular matrix `r`, where `K = min(M, N)`. + + Example: + + >>> x = keras.ops.convert_to_tensor([[1., 2.], [3., 4.], [5., 6.]]) + >>> q, r = qr(x) + >>> print(q) + array([[-0.16903079 0.897085] + [-0.5070925 0.2760267 ] + [-0.8451542 -0.34503305]], shape=(3, 2), dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Qr(mode=mode).symbolic_call(x) + x = backend.convert_to_tensor(x) + return backend.linalg.qr(x, mode=mode) + + +class Solve(Operation): + def __init__(self): + super().__init__() + + def call(self, a, b): + return _solve(a, b) + + def compute_output_spec(self, a, b): + _assert_2d(a) + _assert_square(a) + _assert_1d(b) + _assert_a_b_compat(a, b) + return KerasTensor(b.shape, b.dtype) + + +@keras_export(["keras.ops.solve", "keras.ops.linalg.solve"]) +def solve(a, b): + """Solves a linear system of equations given by `a x = b`. + + Args: + a: A tensor of shape `(..., M, M)` representing the coefficients matrix. 
+ b: A tensor of shape `(..., M)` or `(..., M, N)` representing the + right-hand side or "dependent variable" matrix. + + Returns: + A tensor of shape `(..., M)` or `(..., M, N)` representing the solution + of the linear system. Returned shape is identical to `b`. + + """ + if any_symbolic_tensors((a, b)): + return Solve().symbolic_call(a, b) + return _solve(a, b) + + +def _solve(a, b): + a = backend.convert_to_tensor(a) + b = backend.convert_to_tensor(b) + _assert_2d(a) + _assert_square(a) + _assert_1d(b) + _assert_a_b_compat(a, b) + return backend.linalg.solve(a, b) + + +class SolveTriangular(Operation): + def __init__(self, lower=False): + super().__init__() + self.lower = lower + + def call(self, a, b): + return _solve_triangular(a, b, self.lower) + + def compute_output_spec(self, a, b): + _assert_2d(a) + _assert_square(a) + _assert_1d(b) + _assert_a_b_compat(a, b) + return KerasTensor(b.shape, b.dtype) + + +@keras_export( + ["keras.ops.solve_triangular", "keras.ops.linalg.solve_triangular"] +) +def solve_triangular(a, b, lower=False): + """Solves a linear system of equations given by `a x = b`. + + Args: + a: A tensor of shape `(..., M, M)` representing the coefficients matrix. + b: A tensor of shape `(..., M)` or `(..., M, N)` representing the + right-hand side or "dependent variable" matrix. + + Returns: + A tensor of shape `(..., M)` or `(..., M, N)` representing the solution + of the linear system. Returned shape is identical to `b`. 
+ + """ + if any_symbolic_tensors((a, b)): + return SolveTriangular(lower).symbolic_call(a, b) + return _solve_triangular(a, b, lower) + + +def _solve_triangular(a, b, lower=False): + a = backend.convert_to_tensor(a) + b = backend.convert_to_tensor(b) + _assert_2d(a) + _assert_square(a) + _assert_1d(b) + _assert_a_b_compat(a, b) + return backend.linalg.solve_triangular(a, b, lower) + + +class SVD(Operation): + def __init__(self, full_matrices=True, compute_uv=True): + super().__init__() + self.full_matrices = full_matrices + self.compute_uv = compute_uv + + def call(self, x): + return _svd(x, self.full_matrices, self.compute_uv) + + def compute_output_spec(self, x): + _assert_2d(x) + rows, columns = x.shape[-2:] + batches = x.shape[:-2] + s_shape = batches + (min(rows, columns),) + if self.full_matrices: + u_shape = batches + (rows, rows) + v_shape = batches + (columns, columns) + else: + u_shape = batches + (rows, min(rows, columns)) + v_shape = batches + (min(rows, columns), columns) + + if self.compute_uv: + return ( + KerasTensor(u_shape, x.dtype), + KerasTensor(s_shape, x.dtype), + KerasTensor(v_shape, x.dtype), + ) + return KerasTensor(s_shape, x.dtype) + + +@keras_export(["keras.ops.svd", "keras.ops.linalg.svd"]) +def svd(x, full_matrices=True, compute_uv=True): + """Computes the singular value decomposition of a matrix. + + Args: + x: Input tensor of shape `(..., M, N)`. + + Returns: + A tuple of three tensors: a tensor of shape `(..., M, M)` containing the + left singular vectors, a tensor of shape `(..., M, N)` containing the + singular values and a tensor of shape `(..., N, N)` containing the + right singular vectors. 
+ + """ + if any_symbolic_tensors((x,)): + return SVD(full_matrices, compute_uv).symbolic_call(x) + return _svd(x, full_matrices, compute_uv) + + +def _svd(x, full_matrices=True, compute_uv=True): + x = backend.convert_to_tensor(x) + _assert_2d(x) + return backend.linalg.svd(x, full_matrices, compute_uv) + + +class Lstsq(Operation): + def __init__(self, rcond=None): + super().__init__() + self.rcond = rcond + + def call(self, a, b): + return backend.linalg.lstsq(a, b, rcond=self.rcond) + + def compute_output_spec(self, a, b): + if len(a.shape) != 2: + raise ValueError( + "Expected a to have rank 2. " f"Received: a.shape={a.shape}" + ) + if len(b.shape) not in (1, 2): + raise ValueError( + "Expected b to have rank 1 or 2. " + f"Received: b.shape={b.shape}" + ) + m, n = a.shape + if b.shape[0] != m: + raise ValueError( + "Expected b.shape[0] to be equal to " + "a.shape[0]. Received: " + f"a.shape={a.shape}, b.shape={b.shape}" + ) + if len(b.shape) == 2: + k = b.shape[1] + x = KerasTensor((n, k), dtype=a.dtype) + else: + x = KerasTensor((n,), dtype=a.dtype) + return x + + +@keras_export(["keras.ops.lstsq", "keras.ops.linalg.lstsq"]) +def lstsq(a, b, rcond=None): + """Return the least-squares solution to a linear matrix equation. + + Computes the vector x that approximately solves the equation + `a @ x = b`. The equation may be under-, well-, or over-determined + (i.e., the number of linearly independent rows of a can be less than, + equal to, or greater than its number of linearly independent columns). + If a is square and of full rank, then `x` (but for round-off error) + is the exact solution of the equation. Else, `x` minimizes the + L2 norm of `b - a * x`. + + If there are multiple minimizing solutions, + the one with the smallest L2 norm is returned. + + Args: + a: "Coefficient" matrix of shape `(M, N)`. + b: Ordinate or "dependent variable" values, + of shape `(M,)` or `(M, K)`. 
+ If `b` is two-dimensional, the least-squares solution + is calculated for each of the K columns of `b`. + rcond: Cut-off ratio for small singular values of `a`. + For the purposes of rank determination, + singular values are treated as zero if they are + smaller than rcond times the largest + singular value of `a`. + + Returns: + Tensor with shape `(N,)` or `(N, K)` containing + the least-squares solutions. + + **NOTE:** The output differs from `numpy.linalg.lstsq`. + NumPy returns a tuple with four elements, the first of which + being the least-squares solutions and the others + being essentially never used. + Keras only returns the first value. This is done both + to ensure consistency across backends (which cannot be achieved + for the other values) and to simplify the API. + """ + if any_symbolic_tensors((a, b)): + return Lstsq(rcond=rcond).symbolic_call(a, b) + return backend.linalg.lstsq(a, b, rcond=rcond) + + +def _assert_1d(*arrays): + for a in arrays: + if a.ndim < 1: + raise ValueError( + "Expected input to have rank >= 1. " + "Received scalar input {a}." + ) + + +def _assert_2d(*arrays): + for a in arrays: + if a.ndim < 2: + raise ValueError( + "Expected input to have rank >= 2. " + "Received input with shape {a.shape}." + ) + + +def _assert_square(*arrays): + for a in arrays: + m, n = a.shape[-2:] + if m != n: + raise ValueError( + "Expected a square matrix. " + f"Received non-square input with shape {a.shape}" + ) + + +def _assert_a_b_compat(a, b): + if a.ndim == b.ndim: + if a.shape[-2] != b.shape[-2]: + raise ValueError( + "Incompatible shapes between `a` and `b`. " + "Expected `a.shape[-2] == b.shape[-2]`. " + f"Received: a.shape={a.shape}, b.shape={b.shape}" + ) + elif a.ndim == b.ndim - 1: + if a.shape[-1] != b.shape[-1]: + raise ValueError( + "Incompatible shapes between `a` and `b`. " + "Expected `a.shape[-1] == b.shape[-1]`. 
" + f"Received: a.shape={a.shape}, b.shape={b.shape}" + ) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/math.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/math.py new file mode 100644 index 0000000000000000000000000000000000000000..6cedef62cee4965e824e7f26286ac64b53529dd4 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/math.py @@ -0,0 +1,1046 @@ +"""Commonly used math operations not included in NumPy.""" + +from keras.src import backend +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend import any_symbolic_tensors +from keras.src.ops.operation import Operation +from keras.src.ops.operation_utils import reduce_shape + + +def _segment_reduce_validation(data, segment_ids): + data_shape = data.shape + segment_ids_shape = segment_ids.shape + if len(segment_ids_shape) > 1: + raise ValueError( + "Argument `segment_ids` should be an 1-D vector, got shape: " + f"{len(segment_ids_shape)}. Consider either flatten input with " + "segment_ids.reshape((-1)) and " + "data.reshape((-1, ) + data.shape[len(segment_ids.shape):]) or " + "vectorize with vmap." + ) + if ( + segment_ids_shape[0] is not None + and data_shape[0] is not None + and segment_ids_shape[0] != data_shape[0] + ): + raise ValueError( + "Argument `segment_ids` and `data` should have same leading " + f"dimension. Got {segment_ids_shape} v.s. " + f"{data_shape}." 
+ ) + + +class SegmentReduction(Operation): + def __init__(self, num_segments=None, sorted=False): + super().__init__() + self.num_segments = num_segments + self.sorted = sorted + + def compute_output_spec(self, data, _): + output_shape = (self.num_segments,) + tuple(data.shape[1:]) + return KerasTensor(shape=output_shape, dtype=data.dtype) + + +class SegmentSum(SegmentReduction): + def call(self, data, segment_ids): + _segment_reduce_validation(data, segment_ids) + return backend.math.segment_sum( + data, + segment_ids, + num_segments=self.num_segments, + sorted=self.sorted, + ) + + +@keras_export("keras.ops.segment_sum") +def segment_sum(data, segment_ids, num_segments=None, sorted=False): + """Computes the sum of segments in a tensor. + + Args: + data: Input tensor. + segment_ids: A N-D tensor containing segment indices for each + element in `data`. Num dims for segment ids should be strictly + smaller or equal to number of dims in data. + num_segments: An integer representing the total number of + segments. If not specified, it is inferred from the maximum + value in `segment_ids`. + sorted: A boolean indicating whether `segment_ids` is sorted. + Defaults to `False`. + + Returns: + A tensor containing the sum of segments, where each element + represents the sum of the corresponding segment in `data`. 
+ + Example: + + >>> data = keras.ops.convert_to_tensor([1, 2, 10, 20, 100, 200]) + >>> segment_ids = keras.ops.convert_to_tensor([0, 0, 1, 1, 2, 2]) + >>> num_segments = 3 + >>> keras.ops.segment_sum(data, segment_ids,num_segments) + array([3, 30, 300], dtype=int32) + """ + _segment_reduce_validation(data, segment_ids) + if any_symbolic_tensors((data,)): + return SegmentSum(num_segments, sorted).symbolic_call(data, segment_ids) + return backend.math.segment_sum( + data, segment_ids, num_segments=num_segments, sorted=sorted + ) + + +class SegmentMax(SegmentReduction): + def call(self, data, segment_ids): + _segment_reduce_validation(data, segment_ids) + return backend.math.segment_max( + data, + segment_ids, + num_segments=self.num_segments, + sorted=self.sorted, + ) + + +@keras_export("keras.ops.segment_max") +def segment_max(data, segment_ids, num_segments=None, sorted=False): + """Computes the max of segments in a tensor. + + Args: + data: Input tensor. + segment_ids: A N-D tensor containing segment indices for each + element in `data`. data.shape[:len(segment_ids.shape)] should match. + num_segments: An integer representing the total number of + segments. If not specified, it is inferred from the maximum + value in `segment_ids`. + sorted: A boolean indicating whether `segment_ids` is sorted. + Defaults to `False`. + + Returns: + A tensor containing the max of segments, where each element + represents the max of the corresponding segment in `data`. 
+ + Example: + + >>> data = keras.ops.convert_to_tensor([1, 2, 10, 20, 100, 200]) + >>> segment_ids = keras.ops.convert_to_tensor([0, 0, 1, 1, 2, 2]) + >>> num_segments = 3 + >>> keras.ops.segment_max(data, segment_ids, num_segments) + array([2, 20, 200], dtype=int32) + """ + _segment_reduce_validation(data, segment_ids) + if any_symbolic_tensors((data,)): + return SegmentMax(num_segments, sorted).symbolic_call(data, segment_ids) + return backend.math.segment_max( + data, segment_ids, num_segments=num_segments, sorted=sorted + ) + + +class TopK(Operation): + def __init__(self, k, sorted=False): + super().__init__() + self.k = k + self.sorted = sorted + + def compute_output_spec(self, x): + output_shape = list(x.shape) + output_shape[-1] = self.k + # Return a tuple (values, indices). + return ( + KerasTensor(shape=output_shape, dtype=x.dtype), + KerasTensor(shape=output_shape, dtype="int32"), + ) + + def call(self, x): + return backend.math.top_k(x, self.k, self.sorted) + + +@keras_export("keras.ops.top_k") +def top_k(x, k, sorted=True): + """Finds the top-k values and their indices in a tensor. + + Args: + x: Input tensor. + k: An integer representing the number of top elements to retrieve. + sorted: A boolean indicating whether to sort the output in + descending order. Defaults to `True`. + + Returns: + A tuple containing two tensors. The first tensor contains the + top-k values, and the second tensor contains the indices of the + top-k values in the input tensor. 
+ + Example: + + >>> x = keras.ops.convert_to_tensor([5, 2, 7, 1, 9, 3]) + >>> values, indices = top_k(x, k=3) + >>> print(values) + array([9 7 5], shape=(3,), dtype=int32) + >>> print(indices) + array([4 2 0], shape=(3,), dtype=int32) + + """ + if any_symbolic_tensors((x,)): + return TopK(k, sorted).symbolic_call(x) + return backend.math.top_k(x, k, sorted) + + +class InTopK(Operation): + def __init__(self, k): + super().__init__() + self.k = k + + def compute_output_spec(self, targets, predictions): + return KerasTensor(shape=targets.shape, dtype="bool") + + def call(self, targets, predictions): + return backend.math.in_top_k(targets, predictions, self.k) + + +@keras_export("keras.ops.in_top_k") +def in_top_k(targets, predictions, k): + """Checks if the targets are in the top-k predictions. + + Args: + targets: A tensor of true labels. + predictions: A tensor of predicted labels. + k: An integer representing the number of predictions to consider. + + Returns: + A boolean tensor of the same shape as `targets`, where each element + indicates whether the corresponding target is in the top-k predictions. + + Example: + + >>> targets = keras.ops.convert_to_tensor([2, 5, 3]) + >>> predictions = keras.ops.convert_to_tensor( + ... [[0.1, 0.4, 0.6, 0.9, 0.5], + ... [0.1, 0.7, 0.9, 0.8, 0.3], + ... 
[0.1, 0.6, 0.9, 0.9, 0.5]]) + >>> in_top_k(targets, predictions, k=3) + array([ True False True], shape=(3,), dtype=bool) + """ + if any_symbolic_tensors((targets, predictions)): + return InTopK(k).symbolic_call(targets, predictions) + return backend.math.in_top_k(targets, predictions, k) + + +class Logsumexp(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + self.axis = axis + self.keepdims = keepdims + + def compute_output_spec(self, x): + output_shape = reduce_shape(x.shape, self.axis, self.keepdims) + return KerasTensor(shape=output_shape) + + def call(self, x): + return backend.math.logsumexp(x, axis=self.axis, keepdims=self.keepdims) + + +@keras_export("keras.ops.logsumexp") +def logsumexp(x, axis=None, keepdims=False): + """Computes the logarithm of sum of exponentials of elements in a tensor. + + Args: + x: Input tensor. + axis: An integer or a tuple of integers specifying the axis/axes + along which to compute the sum. If `None`, the sum is computed + over all elements. Defaults to `None`. + keepdims: A boolean indicating whether to keep the dimensions of + the input tensor when computing the sum. Defaults to `False`. + + Returns: + A tensor containing the logarithm of the sum of exponentials of + elements in `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([1., 2., 3.]) + >>> logsumexp(x) + 3.407606 + """ + if any_symbolic_tensors((x,)): + return Logsumexp(axis, keepdims).symbolic_call(x) + return backend.math.logsumexp(x, axis=axis, keepdims=keepdims) + + +class ExtractSequences(Operation): + def __init__(self, sequence_length, sequence_stride): + super().__init__() + self.sequence_length = sequence_length + self.sequence_stride = sequence_stride + + def compute_output_spec(self, x): + if len(x.shape) < 1: + raise ValueError( + f"Input should have rank >= 1. 
" + f"Received: input.shape = {x.shape}" + ) + if x.shape[-1] is not None: + num_sequences = ( + 1 + (x.shape[-1] - self.sequence_length) // self.sequence_stride + ) + else: + num_sequences = None + new_shape = x.shape[:-1] + (num_sequences, self.sequence_length) + return KerasTensor(shape=new_shape, dtype=x.dtype) + + def call(self, x): + return backend.math.extract_sequences( + x, + sequence_length=self.sequence_length, + sequence_stride=self.sequence_stride, + ) + + +@keras_export("keras.ops.extract_sequences") +def extract_sequences(x, sequence_length, sequence_stride): + """Expands the dimension of last axis into sequences of `sequence_length`. + + Slides a window of size `sequence_length` over the last axis of the input + with a stride of `sequence_stride`, replacing the last axis with + `[num_sequences, sequence_length]` sequences. + + If the dimension along the last axis is N, the number of sequences can be + computed by: + + `num_sequences = 1 + (N - sequence_length) // sequence_stride` + + Args: + x: Input tensor. + sequence_length: An integer representing the sequences length. + sequence_stride: An integer representing the sequences hop size. + + Returns: + A tensor of sequences with shape [..., num_sequences, sequence_length]. + + Example: + + >>> x = keras.ops.convert_to_tensor([1, 2, 3, 4, 5, 6]) + >>> extract_sequences(x, 3, 2) + array([[1, 2, 3], + [3, 4, 5]]) + """ + if any_symbolic_tensors((x,)): + return ExtractSequences(sequence_length, sequence_stride).symbolic_call( + x + ) + return backend.math.extract_sequences(x, sequence_length, sequence_stride) + + +class FFT(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def compute_output_spec(self, x): + if not isinstance(x, (tuple, list)) or len(x) != 2: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + f"imaginary. Received: x={x}" + ) + + real, imag = x + # Both real and imaginary parts should have the same shape. 
+ if real.shape != imag.shape: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + "imaginary. Both the real and imaginary parts should have the " + f"same shape. Received: x[0].shape = {real.shape}, " + f"x[1].shape = {imag.shape}" + ) + + # We are calculating 1D FFT. Hence, rank >= 1. + if len(real.shape) < 1: + raise ValueError( + f"Input should have rank >= 1. " + f"Received: input.shape = {real.shape}" + ) + + # The axis along which we are calculating FFT should be fully-defined. + m = real.shape[-1] + if m is None: + raise ValueError( + f"Input should have its {self.axis}th axis fully-defined. " + f"Received: input.shape = {real.shape}" + ) + + return ( + KerasTensor(shape=real.shape, dtype=real.dtype), + KerasTensor(shape=imag.shape, dtype=imag.dtype), + ) + + def call(self, x): + return backend.math.fft(x) + + +@keras_export("keras.ops.fft") +def fft(x): + """Computes the Fast Fourier Transform along last axis of input. + + Args: + x: Tuple of the real and imaginary parts of the input tensor. Both + tensors in the tuple should be of floating type. + + Returns: + A tuple containing two tensors - the real and imaginary parts of the + output tensor. + + Example: + + >>> x = ( + ... keras.ops.convert_to_tensor([1., 2.]), + ... keras.ops.convert_to_tensor([0., 1.]), + ... ) + >>> fft(x) + (array([ 3., -1.], dtype=float32), array([ 1., -1.], dtype=float32)) + """ + if any_symbolic_tensors(x): + return FFT().symbolic_call(x) + return backend.math.fft(x) + + +class FFT2(Operation): + def __init__(self): + super().__init__() + self.axes = (-2, -1) + + def compute_output_spec(self, x): + if not isinstance(x, (tuple, list)) or len(x) != 2: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + f"imaginary. Received: x={x}" + ) + + real, imag = x + # Both real and imaginary parts should have the same shape. 
+ if real.shape != imag.shape: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + "imaginary. Both the real and imaginary parts should have the " + f"same shape. Received: x[0].shape = {real.shape}, " + f"x[1].shape = {imag.shape}" + ) + # We are calculating 2D FFT. Hence, rank >= 2. + if len(real.shape) < 2: + raise ValueError( + f"Input should have rank >= 2. " + f"Received: input.shape = {real.shape}" + ) + + # The axes along which we are calculating FFT should be fully-defined. + m = real.shape[self.axes[0]] + n = real.shape[self.axes[1]] + if m is None or n is None: + raise ValueError( + f"Input should have its {self.axes} axes fully-defined. " + f"Received: input.shape = {real.shape}" + ) + + return ( + KerasTensor(shape=real.shape, dtype=real.dtype), + KerasTensor(shape=imag.shape, dtype=imag.dtype), + ) + + def call(self, x): + return backend.math.fft2(x) + + +@keras_export("keras.ops.fft2") +def fft2(x): + """Computes the 2D Fast Fourier Transform along the last two axes of input. + + Args: + x: Tuple of the real and imaginary parts of the input tensor. Both + tensors in the tuple should be of floating type. + + Returns: + A tuple containing two tensors - the real and imaginary parts of the + output. + + Example: + + >>> x = ( + ... keras.ops.convert_to_tensor([[1., 2.], [2., 1.]]), + ... keras.ops.convert_to_tensor([[0., 1.], [1., 0.]]), + ... ) + >>> fft2(x) + (array([[ 6., 0.], + [ 0., -2.]], dtype=float32), array([[ 2., 0.], + [ 0., -2.]], dtype=float32)) + """ + if any_symbolic_tensors(x): + return FFT2().symbolic_call(x) + return backend.math.fft2(x) + + +class IFFT2(Operation): + def __init__(self): + super().__init__() + self.axes = (-2, -1) + + def compute_output_spec(self, x): + if not isinstance(x, (tuple, list)) or len(x) != 2: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + f"imaginary. 
Received: x={x}" + ) + + real, imag = x + # Both real and imaginary parts should have the same shape. + if real.shape != imag.shape: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + "imaginary. Both the real and imaginary parts should have the " + f"same shape. Received: x[0].shape = {real.shape}, " + f"x[1].shape = {imag.shape}" + ) + # We are calculating 2D IFFT. Hence, rank >= 2. + if len(real.shape) < 2: + raise ValueError( + f"Input should have rank >= 2. " + f"Received: input.shape = {real.shape}" + ) + + # The axes along which we are calculating IFFT should be fully-defined. + m = real.shape[self.axes[0]] + n = real.shape[self.axes[1]] + if m is None or n is None: + raise ValueError( + f"Input should have its {self.axes} axes fully-defined. " + f"Received: input.shape = {real.shape}" + ) + + return ( + KerasTensor(shape=real.shape, dtype=real.dtype), + KerasTensor(shape=imag.shape, dtype=imag.dtype), + ) + + def call(self, x): + return backend.math.ifft2(x) + + +@keras_export("keras.ops.ifft2") +def ifft2(x): + """Computes the 2D Inverse Fast Fourier Transform along the last two axes of + input. + + Args: + x: Tuple of the real and imaginary parts of the input tensor. Both + tensors in the tuple should be of floating type. + + Returns: + A tuple containing two tensors - the real and imaginary parts of the + output. + + Example: + + >>> x = ( + ... keras.ops.convert_to_tensor([[1., 2.], [2., 1.]]), + ... keras.ops.convert_to_tensor([[0., 1.], [1., 0.]]), + ... ) + >>> ifft2(x) + (array([[ 6., 0.], + [ 0., -2.]], dtype=float32), array([[ 2., 0.], + [ 0., -2.]], dtype=float32)) + """ + if any_symbolic_tensors(x): + return IFFT2().symbolic_call(x) + return backend.math.ifft2(x) + + +class RFFT(Operation): + def __init__(self, fft_length=None): + super().__init__() + self.fft_length = fft_length + + def compute_output_spec(self, x): + # We are calculating 1D RFFT. Hence, rank >= 1. 
+ if len(x.shape) < 1: + raise ValueError( + f"Input should have rank >= 1. " + f"Received: input.shape = {x.shape}" + ) + + if self.fft_length is not None: + new_last_dimension = self.fft_length // 2 + 1 + else: + if x.shape[-1] is not None: + new_last_dimension = x.shape[-1] // 2 + 1 + else: + new_last_dimension = None + new_shape = x.shape[:-1] + (new_last_dimension,) + + return ( + KerasTensor(shape=new_shape, dtype=x.dtype), + KerasTensor(shape=new_shape, dtype=x.dtype), + ) + + def call(self, x): + return backend.math.rfft(x, fft_length=self.fft_length) + + +@keras_export("keras.ops.rfft") +def rfft(x, fft_length=None): + """Real-valued Fast Fourier Transform along the last axis of the input. + + Computes the 1D Discrete Fourier Transform of a real-valued signal over the + inner-most dimension of input. + + Since the Discrete Fourier Transform of a real-valued signal is + Hermitian-symmetric, RFFT only returns the `fft_length / 2 + 1` unique + components of the FFT: the zero-frequency term, followed by the + `fft_length / 2` positive-frequency terms. + + Along the axis RFFT is computed on, if `fft_length` is smaller than the + corresponding dimension of the input, the dimension is cropped. If it is + larger, the dimension is padded with zeros. + + Args: + x: Input tensor. + fft_length: An integer representing the number of the fft length. If not + specified, it is inferred from the length of the last axis of `x`. + Defaults to `None`. + + Returns: + A tuple containing two tensors - the real and imaginary parts of the + output. 
+ + Examples: + + >>> x = keras.ops.convert_to_tensor([0.0, 1.0, 2.0, 3.0, 4.0]) + >>> rfft(x) + (array([10.0, -2.5, -2.5]), array([0.0, 3.4409548, 0.81229924])) + + >>> rfft(x, 3) + (array([3.0, -1.5]), array([0.0, 0.8660254])) + """ + if any_symbolic_tensors((x,)): + return RFFT(fft_length).symbolic_call(x) + return backend.math.rfft(x, fft_length) + + +class IRFFT(Operation): + def __init__(self, fft_length=None): + super().__init__() + self.fft_length = fft_length + + def compute_output_spec(self, x): + if not isinstance(x, (tuple, list)) or len(x) != 2: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + f"imaginary. Received: x={x}" + ) + real, imag = x + # Both real and imaginary parts should have the same shape. + if real.shape != imag.shape: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + "imaginary. Both the real and imaginary parts should have the " + f"same shape. Received: x[0].shape = {real.shape}, " + f"x[1].shape = {imag.shape}" + ) + # We are calculating 1D IRFFT. Hence, rank >= 1. + if len(real.shape) < 1: + raise ValueError( + f"Input should have rank >= 1. " + f"Received: input.shape = {real.shape}" + ) + + if self.fft_length is not None: + new_last_dimension = self.fft_length + else: + if real.shape[-1] is not None: + new_last_dimension = 2 * (real.shape[-1] - 1) + else: + new_last_dimension = None + new_shape = real.shape[:-1] + (new_last_dimension,) + return KerasTensor(shape=new_shape, dtype=real.dtype) + + def call(self, x): + return backend.math.irfft(x, fft_length=self.fft_length) + + +@keras_export("keras.ops.irfft") +def irfft(x, fft_length=None): + """Inverse real-valued Fast Fourier transform along the last axis. + + Computes the inverse 1D Discrete Fourier Transform of a real-valued signal + over the inner-most dimension of input. 
+ + The inner-most dimension of the input is assumed to be the result of RFFT: + the `fft_length / 2 + 1` unique components of the DFT of a real-valued + signal. If `fft_length` is not provided, it is computed from the size of the + inner-most dimension of the input `(fft_length = 2 * (inner - 1))`. If the + FFT length used to compute is odd, it should be provided since it cannot + be inferred properly. + + Along the axis IRFFT is computed on, if `fft_length / 2 + 1` is smaller than + the corresponding dimension of the input, the dimension is cropped. If it is + larger, the dimension is padded with zeros. + + Args: + x: Tuple of the real and imaginary parts of the input tensor. Both + tensors in the tuple should be of floating type. + fft_length: An integer representing the number of the fft length. If not + specified, it is inferred from the length of the last axis of `x`. + Defaults to `None`. + + Returns: + A tensor containing the inverse real-valued Fast Fourier Transform + along the last axis of `x`. 
+ + Examples: + + >>> real = keras.ops.convert_to_tensor([0.0, 1.0, 2.0, 3.0, 4.0]) + >>> imag = keras.ops.convert_to_tensor([0.0, 1.0, 2.0, 3.0, 4.0]) + >>> irfft((real, imag)) + array([0.66666667, -0.9106836, 0.24401694]) + + >>> irfft(rfft(real, 5), 5) + array([0.0, 1.0, 2.0, 3.0, 4.0]) + """ + if any_symbolic_tensors(x): + return IRFFT(fft_length).symbolic_call(x) + return backend.math.irfft(x, fft_length) + + +class STFT(Operation): + def __init__( + self, + sequence_length, + sequence_stride, + fft_length, + window="hann", + center=True, + ): + super().__init__() + self.sequence_length = sequence_length + self.sequence_stride = sequence_stride + self.fft_length = fft_length + self.window = window + self.center = center + + def compute_output_spec(self, x): + if x.shape[-1] is not None: + padded = 0 if self.center is False else (self.fft_length // 2) * 2 + num_sequences = ( + 1 + + (x.shape[-1] + padded - self.fft_length) + // self.sequence_stride + ) + else: + num_sequences = None + new_shape = x.shape[:-1] + (num_sequences, self.fft_length // 2 + 1) + return ( + KerasTensor(shape=new_shape, dtype=x.dtype), + KerasTensor(shape=new_shape, dtype=x.dtype), + ) + + def call(self, x): + return backend.math.stft( + x, + sequence_length=self.sequence_length, + sequence_stride=self.sequence_stride, + fft_length=self.fft_length, + window=self.window, + center=self.center, + ) + + +@keras_export("keras.ops.stft") +def stft( + x, sequence_length, sequence_stride, fft_length, window="hann", center=True +): + """Short-Time Fourier Transform along the last axis of the input. + + The STFT computes the Fourier transform of short overlapping windows of the + input. This giving frequency components of the signal as they change over + time. + + Args: + x: Input tensor. + sequence_length: An integer representing the sequence length. + sequence_stride: An integer representing the sequence hop size. + fft_length: An integer representing the size of the FFT to apply. 
If not + specified, uses the smallest power of 2 enclosing `sequence_length`. + window: A string, a tensor of the window or `None`. If `window` is a + string, available values are `"hann"` and `"hamming"`. If `window` + is a tensor, it will be used directly as the window and its length + must be `sequence_length`. If `window` is `None`, no windowing is + used. Defaults to `"hann"`. + center: Whether to pad `x` on both sides so that the t-th sequence is + centered at time `t * sequence_stride`. Otherwise, the t-th sequence + begins at time `t * sequence_stride`. Defaults to `True`. + + Returns: + A tuple containing two tensors - the real and imaginary parts of the + STFT output. + + Example: + + >>> x = keras.ops.convert_to_tensor([0.0, 1.0, 2.0, 3.0, 4.0]) + >>> stft(x, 3, 2, 3) + (array([[0.75, -0.375], + [3.75, -1.875], + [5.25, -2.625]]), array([[0.0, 0.64951905], + [0.0, 0.64951905], + [0.0, -0.64951905]])) + """ + if any_symbolic_tensors((x,)): + return STFT( + sequence_length=sequence_length, + sequence_stride=sequence_stride, + fft_length=fft_length, + window=window, + center=center, + ).symbolic_call(x) + return backend.math.stft( + x, + sequence_length=sequence_length, + sequence_stride=sequence_stride, + fft_length=fft_length, + window=window, + center=center, + ) + + +class ISTFT(Operation): + def __init__( + self, + sequence_length, + sequence_stride, + fft_length, + length=None, + window="hann", + center=True, + ): + super().__init__() + self.sequence_length = sequence_length + self.sequence_stride = sequence_stride + self.fft_length = fft_length + self.length = length + self.window = window + self.center = center + + def compute_output_spec(self, x): + if not isinstance(x, (tuple, list)) or len(x) != 2: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + f"imaginary. Received: x={x}" + ) + real, imag = x + # Both real and imaginary parts should have the same shape. 
+ if real.shape != imag.shape: + raise ValueError( + "Input `x` should be a tuple of two tensors - real and " + "imaginary. Both the real and imaginary parts should have the " + f"same shape. Received: x[0].shape = {real.shape}, " + f"x[1].shape = {imag.shape}" + ) + if len(real.shape) < 2: + raise ValueError( + f"Input should have rank >= 2. " + f"Received: input.shape = {real.shape}" + ) + if real.shape[-2] is not None: + output_size = ( + real.shape[-2] - 1 + ) * self.sequence_stride + self.fft_length + if self.length is not None: + output_size = self.length + elif self.center: + output_size = output_size - (self.fft_length // 2) * 2 + else: + output_size = None + new_shape = real.shape[:-2] + (output_size,) + return KerasTensor(shape=new_shape, dtype=real.dtype) + + def call(self, x): + return backend.math.istft( + x, + sequence_length=self.sequence_length, + sequence_stride=self.sequence_stride, + fft_length=self.fft_length, + length=self.length, + window=self.window, + center=self.center, + ) + + +@keras_export("keras.ops.istft") +def istft( + x, + sequence_length, + sequence_stride, + fft_length, + length=None, + window="hann", + center=True, +): + """Inverse Short-Time Fourier Transform along the last axis of the input. + + To reconstruct an original waveform, the parameters should be the same in + `stft`. + + Args: + x: Tuple of the real and imaginary parts of the input tensor. Both + tensors in the tuple should be of floating type. + sequence_length: An integer representing the sequence length. + sequence_stride: An integer representing the sequence hop size. + fft_length: An integer representing the size of the FFT that produced + `stft`. Should be of type `int32`. + length: An integer representing the output is clipped to exactly length. + If not specified, no padding or clipping take place. Defaults to + `None`. + window: A string, a tensor of the window or `None`. If `window` is a + string, available values are `"hann"` and `"hamming"`. 
If `window` + is a tensor, it will be used directly as the window and its length + must be `sequence_length`. If `window` is `None`, no windowing is + used. Defaults to `"hann"`. + center: Whether `x` was padded on both sides so that the t-th sequence + is centered at time `t * sequence_stride`. Defaults to `True`. + + Returns: + A tensor containing the inverse Short-Time Fourier Transform along the + last axis of `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([0.0, 1.0, 2.0, 3.0, 4.0]) + >>> istft(stft(x, 1, 1, 1), 1, 1, 1) + array([0.0, 1.0, 2.0, 3.0, 4.0]) + """ + if any_symbolic_tensors(x): + return ISTFT( + sequence_length=sequence_length, + sequence_stride=sequence_stride, + fft_length=fft_length, + window=window, + center=center, + ).symbolic_call(x) + return backend.math.istft( + x, + sequence_length=sequence_length, + sequence_stride=sequence_stride, + fft_length=fft_length, + length=length, + window=window, + center=center, + ) + + +class Rsqrt(Operation): + def call(self, x): + x = backend.convert_to_tensor(x) + return backend.math.rsqrt(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export("keras.ops.rsqrt") +def rsqrt(x): + """Computes reciprocal of square root of x element-wise. + + Args: + x: input tensor + + Returns: + A tensor with the same dtype as `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([1.0, 10.0, 100.0]) + >>> keras.ops.rsqrt(x) + array([1.0, 0.31622776, 0.1], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Rsqrt().symbolic_call(x) + x = backend.convert_to_tensor(x) + return backend.math.rsqrt(x) + + +class Erf(Operation): + def compute_output_spec(self, x): + return KerasTensor(shape=x.shape, dtype=x.dtype) + + def call(self, x): + return backend.math.erf(x) + + +@keras_export("keras.ops.erf") +def erf(x): + """Computes the error function of `x`, element-wise. + + Args: + x: Input tensor. + + Returns: + A tensor with the same dtype as `x`. 
+ + Example: + + >>> x = np.array([-3.0, -2.0, -1.0, 0.0, 1.0]) + >>> keras.ops.erf(x) + array([-0.99998 , -0.99532, -0.842701, 0., 0.842701], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Erf().symbolic_call(x) + x = backend.convert_to_tensor(x) + return backend.math.erf(x) + + +class Erfinv(Operation): + def compute_output_spec(self, x): + return KerasTensor(shape=x.shape, dtype=x.dtype) + + def call(self, x): + return backend.math.erfinv(x) + + +@keras_export("keras.ops.erfinv") +def erfinv(x): + """Computes the inverse error function of `x`, element-wise. + + Args: + x: Input tensor. + + Returns: + A tensor with the same dtype as `x`. + + Example: + + >>> x = np.array([-0.5, -0.2, -0.1, 0.0, 0.3]) + >>> keras.ops.erfinv(x) + array([-0.47694, -0.17914, -0.08886, 0. , 0.27246], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Erfinv().symbolic_call(x) + x = backend.convert_to_tensor(x) + return backend.math.erfinv(x) + + +class Logdet(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.math.logdet(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape[:-2], dtype=x.dtype) + + +@keras_export(["keras.ops.logdet"]) +def logdet(x): + """Computes log of the determinant of a hermitian positive definite matrix. + + Args: + x: Input matrix. It must 2D and square. + + Returns: + The natural log of the determinant of matrix. 
+ """ + if any_symbolic_tensors((x,)): + return Logdet().symbolic_call(x) + return backend.math.logdet(x) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/nn.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/nn.py new file mode 100644 index 0000000000000000000000000000000000000000..4bbd0469f264f48452b15cda903a5bfb75bf3da9 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/nn.py @@ -0,0 +1,2653 @@ +"""Commonly-used neural network operations not included in NumPy.""" + +import warnings + +from keras.src import backend +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend import any_symbolic_tensors +from keras.src.backend import standardize_data_format +from keras.src.backend.common.backend_utils import ( + compute_conv_transpose_output_shape, +) +from keras.src.ops import operation_utils +from keras.src.ops.operation import Operation +from keras.src.ops.operation_utils import reduce_shape + + +class Relu(Operation): + def call(self, x): + return backend.nn.relu(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.relu", "keras.ops.nn.relu"]) +def relu(x): + """Rectified linear unit activation function. + + It is defined as `f(x) = max(0, x)`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x1 = keras.ops.convert_to_tensor([-1.0, 0.0, 1.0, 0.2]) + >>> keras.ops.relu(x1) + array([0.0, 0.0, 1.0, 0.2], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Relu().symbolic_call(x) + return backend.nn.relu(x) + + +class Relu6(Operation): + def call(self, x): + return backend.nn.relu6(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.relu6", "keras.ops.nn.relu6"]) +def relu6(x): + """Rectified linear unit activation function with upper bound of 6. + + It is defined as `f(x) = np.clip(x, 0, 6)`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([-3.0, -2.0, 0.1, 0.2, 6.0, 8.0]) + >>> keras.ops.relu6(x) + array([0.0, 0.0, 0.1, 0.2, 6.0, 6.0], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Relu6().symbolic_call(x) + return backend.nn.relu6(x) + + +class Sigmoid(Operation): + def call(self, x): + return backend.nn.sigmoid(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.sigmoid", "keras.ops.nn.sigmoid"]) +def sigmoid(x): + """Sigmoid activation function. + + It is defined as `f(x) = 1 / (1 + exp(-x))`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([-6.0, 1.0, 0.0, 1.0, 6.0]) + >>> keras.ops.sigmoid(x) + array([0.00247262, 0.7310586, 0.5, 0.7310586, 0.9975274], dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return Sigmoid().symbolic_call(x) + return backend.nn.sigmoid(x) + + +class Softplus(Operation): + def call(self, x): + return backend.nn.softplus(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.softplus", "keras.ops.nn.softplus"]) +def softplus(x): + """Softplus activation function. 
+ + It is defined as `f(x) = log(exp(x) + 1)`, where `log` is the natural + logarithm and `exp` is the exponential function. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([-0.555, 0.0, 0.555]) + >>> keras.ops.softplus(x) + array([0.45366603, 0.6931472, 1.008666], dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return Softplus().symbolic_call(x) + return backend.nn.softplus(x) + + +class Softsign(Operation): + def call(self, x): + return backend.nn.softsign(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.softsign", "keras.ops.nn.softsign"]) +def softsign(x): + """Softsign activation function. + + It is defined as `f(x) = x / (abs(x) + 1)`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([-0.100, -10.0, 1.0, 0.0, 100.0]) + >>> keras.ops.softsign(x) + Array([-0.09090909, -0.90909094, 0.5, 0.0, 0.990099], dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return Softsign().symbolic_call(x) + return backend.nn.softsign(x) + + +class SoftShrink(Operation): + def __init__(self, threshold=0.5): + super().__init__() + self.threshold = threshold + + def call(self, x): + return backend.nn.soft_shrink(x, self.threshold) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.soft_shrink", "keras.ops.nn.soft_shrink"]) +def soft_shrink(x, threshold=0.5): + """Soft Shrink activation function. + + It is defined as + + `f(x) = x - threshold` if `x > threshold`, + `f(x) = x + threshold` if `x < -threshold`, + `f(x) = 0` otherwise. + + Args: + x: Input tensor. + threshold: Threshold value. Defaults to 0.5. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = np.array([-1.0, 0.0, 1.0]) + >>> x_soft_shrink = keras.ops.soft_shrink(x) + >>> print(x_soft_shrink) + array([-0.5 0. 0.5], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return SoftShrink(threshold).symbolic_call(x) + return backend.nn.soft_shrink(x, threshold) + + +class SparsePlus(Operation): + def call(self, x): + return backend.nn.sparse_plus(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.sparse_plus", "keras.ops.nn.sparse_plus"]) +def sparse_plus(x): + """SparsePlus activation function. + + It is defined as + + `f(x) = 0` for `x <= -1`. + `f(x) = (1/4) * (x + 1)^2` for `-1 < x < 1`. + `f(x) = x` for `x >= 1`. + + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-1.0, 0.0, 1.0]) + >>> x_sparse_plus = keras.ops.sparse_plus(x) + >>> print(x_sparse_plus) + Array([0. 0.25 1. ], shape=(3,), dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return SparsePlus().symbolic_call(x) + return backend.nn.sparse_plus(x) + + +class Silu(Operation): + def call(self, x): + return backend.nn.silu(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.silu", + "keras.ops.nn.silu", + "keras.ops.swish", + "keras.ops.nn.swish", + ] +) +def silu(x): + """Sigmoid Linear Unit (SiLU) activation function, also known as Swish. + + The SiLU activation function is computed by the sigmoid function multiplied + by its input. It is defined as `f(x) = x * sigmoid(x)`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = keras.ops.convert_to_tensor([-6.0, 1.0, 0.0, 1.0, 6.0]) + >>> keras.ops.sigmoid(x) + array([0.00247262, 0.7310586, 0.5, 0.7310586, 0.9975274], dtype=float32) + >>> keras.ops.silu(x) + array([-0.0148357, 0.7310586, 0.0, 0.7310586, 5.9851646], dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return Silu().symbolic_call(x) + return backend.nn.silu(x) + + +class Squareplus(Operation): + def __init__(self, b=4): + super().__init__() + self.b = b + + def call(self, x): + return backend.nn.squareplus(x, self.b) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.squareplus", "keras.ops.nn.squareplus"]) +def squareplus(x, b=4): + """Squareplus activation function. + + The Squareplus activation function is defined as: + + `f(x) = (x + sqrt(x^2 + b)) / 2` + + Args: + x: Input tensor. + b: Smoothness parameter. Defaults to 4. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-1.0, 0.0, 1.0]) + >>> x_squareplus = keras.ops.squareplus(x) + >>> print(x_squareplus) + array([0.6180, 1.0000, 1.6180], dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return Squareplus(b).symbolic_call(x) + return backend.nn.squareplus(x, b) + + +class LogSigmoid(Operation): + def call(self, x): + return backend.nn.log_sigmoid(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.log_sigmoid", + "keras.ops.nn.log_sigmoid", + ] +) +def log_sigmoid(x): + """Logarithm of the sigmoid activation function. + + It is defined as `f(x) = log(1 / (1 + exp(-x)))`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = keras.ops.convert_to_tensor([-0.541391, 0.0, 0.50, 5.0]) + >>> keras.ops.log_sigmoid(x) + array([-1.0000418, -0.6931472, -0.474077, -0.00671535], dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return LogSigmoid().symbolic_call(x) + return backend.nn.log_sigmoid(x) + + +class LeakyRelu(Operation): + def __init__(self, negative_slope=0.2): + super().__init__() + self.negative_slope = negative_slope + + def call(self, x): + return backend.nn.leaky_relu(x, self.negative_slope) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.leaky_relu", "keras.ops.nn.leaky_relu"]) +def leaky_relu(x, negative_slope=0.2): + """Leaky version of a Rectified Linear Unit activation function. + + It allows a small gradient when the unit is not active, it is defined as: + + `f(x) = alpha * x for x < 0` or `f(x) = x for x >= 0`. + + Args: + x: Input tensor. + negative_slope: Slope of the activation function at x < 0. + Defaults to `0.2`. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_leaky_relu = keras.ops.leaky_relu(x) + >>> print(x_leaky_relu) + array([-0.2, 0. , 1. ], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return LeakyRelu(negative_slope).symbolic_call(x) + return backend.nn.leaky_relu(x, negative_slope=negative_slope) + + +class HardSigmoid(Operation): + def call(self, x): + return backend.nn.hard_sigmoid(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.hard_sigmoid", + "keras.ops.nn.hard_sigmoid", + ] +) +def hard_sigmoid(x): + """Hard sigmoid activation function. + + It is defined as: + + `0 if x < -2.5`, `1 if x > 2.5`, `(0.2 * x) + 0.5 if -2.5 <= x <= 2.5`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_hard_sigmoid = keras.ops.hard_sigmoid(x) + >>> print(x_hard_sigmoid) + array([0.3, 0.5, 0.7], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return HardSigmoid().symbolic_call(x) + return backend.nn.hard_sigmoid(x) + + +class HardSilu(Operation): + def call(self, x): + return backend.nn.hard_silu(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.hard_silu", + "keras.ops.nn.hard_silu", + "keras.ops.hard_swish", + "keras.ops.nn.hard_swish", + ] +) +def hard_silu(x): + """Hard SiLU activation function, also known as Hard Swish. + + It is defined as: + + - `0` if `if x < -3` + - `x` if `x > 3` + - `x * (x + 3) / 6` if `-3 <= x <= 3` + + It's a faster, piecewise linear approximation of the silu activation. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = keras.ops.convert_to_tensor([-3.0, -1.0, 0.0, 1.0, 3.0]) + >>> keras.ops.hard_silu(x) + array([-0.0, -0.3333333, 0.0, 0.6666667, 3.0], shape=(5,), dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return HardSilu().symbolic_call(x) + return backend.nn.hard_silu(x) + + +class Elu(Operation): + def __init__(self, alpha=1.0): + super().__init__() + self.alpha = alpha + + def call(self, x): + return backend.nn.elu(x, alpha=self.alpha) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.elu", "keras.ops.nn.elu"]) +def elu(x, alpha=1.0): + """Exponential Linear Unit activation function. + + It is defined as: + + `f(x) = alpha * (exp(x) - 1.) for x < 0`, `f(x) = x for x >= 0`. + + Args: + x: Input tensor. + alpha: A scalar, slope of positive section. Defaults to `1.0`. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_elu = keras.ops.elu(x) + >>> print(x_elu) + array([-0.63212055, 0., 1.], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Elu(alpha).symbolic_call(x) + return backend.nn.elu(x, alpha=alpha) + + +class Selu(Operation): + def call(self, x): + return backend.nn.selu(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.selu", "keras.ops.nn.selu"]) +def selu(x): + """Scaled Exponential Linear Unit (SELU) activation function. + + It is defined as: + + `f(x) = scale * alpha * (exp(x) - 1.) for x < 0`, + `f(x) = scale * x for x >= 0`. + + Args: + x: Input tensor. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_selu = keras.ops.selu(x) + >>> print(x_selu) + array([-1.11133055, 0., 1.05070098], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Selu().symbolic_call(x) + return backend.nn.selu(x) + + +class Gelu(Operation): + def __init__(self, approximate=True): + super().__init__() + self.approximate = approximate + + def call(self, x): + return backend.nn.gelu(x, self.approximate) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.gelu", "keras.ops.nn.gelu"]) +def gelu(x, approximate=True): + """Gaussian Error Linear Unit (GELU) activation function. + + If `approximate` is `True`, it is defined as: + `f(x) = 0.5 * x * (1 + tanh(sqrt(2 / pi) * (x + 0.044715 * x^3)))` + + Or if `approximate` is `False`, it is defined as: + `f(x) = x * P(X <= x) = 0.5 * x * (1 + erf(x / sqrt(2)))`, + where `P(X) ~ N(0, 1)`. + + Args: + x: Input tensor. + approximate: Approximate version of GELU activation. Defaults to `True`. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_gelu = keras.ops.gelu(x) + >>> print(x_gelu) + array([-0.15865525, 0., 0.84134475], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Gelu(approximate).symbolic_call(x) + return backend.nn.gelu(x, approximate) + + +class Celu(Operation): + def __init__(self, alpha=1.0): + super().__init__() + self.alpha = alpha + + def call(self, x): + return backend.nn.celu(x, self.alpha) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.celu", "keras.ops.nn.celu"]) +def celu(x, alpha=1.0): + """Continuously-differentiable exponential linear unit. + + It is defined as: + + `f(x) = alpha * (exp(x / alpha) - 1) for x < 0`, `f(x) = x for x >= 0`. + + Args: + x: Input tensor. + alpha: the α value for the CELU formulation. Defaults to `1.0`. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_celu = keras.ops.celu(x) + >>> print(x_celu) + array([-0.63212056, 0. , 1. ], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Celu(alpha).symbolic_call(x) + return backend.nn.celu(x, alpha) + + +class Glu(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.nn.glu(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.glu", "keras.ops.nn.glu"]) +def glu(x, axis=-1): + """Gated Linear Unit (GLU) activation function. + + It is defined as: + + `f(x) = a * sigmoid(b)` + where `x` is split into `a` and `b` along the given axis. + + Args: + x: Input tensor. + axis: The axis along which to split the input tensor. Defaults to `-1`. + + Returns: + A tensor with the same shape as half of the input. + + Example: + + >>> x = np.array([-1., 0., 1. , 1.]) + >>> x_glu = keras.ops.glu(x) + >>> print(x_glu) + array([-0.73105858, 0. 
], shape=(2,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Glu(axis).symbolic_call(x) + return backend.nn.glu(x, axis=axis) + + +class TanhShrink(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.nn.tanh_shrink(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.tanh_shrink", "keras.ops.nn.tanh_shrink"]) +def tanh_shrink(x): + """Applies the tanh shrink function element-wise. + + It is defined as: + + `f(x) = x - tanh(x)`. + + Args: + x: Input tensor. + + Returns: + Output tensor of the same shape as `x`, where each element is + transformed according to the tanh shrink operation. + + Example: + + >>> x = np.array([ -1., 0., 1.]) + >>> x_tanh_shrink = keras.ops.tanh_shrink(x) + >>> print(x_tanh_shrink) + array([-0.23840584 0. 0.23840584], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return TanhShrink().symbolic_call(x) + return backend.nn.tanh_shrink(x) + + +class HardTanh(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.nn.hard_tanh(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.hard_tanh", "keras.ops.nn.hard_tanh"]) +def hard_tanh(x): + """Applies the HardTanh function element-wise. + + It is defined as: + + `f(x) = -1 for x < -1`, `f(x) = x for -1 <= x <= 1`, `f(x) = 1 for x > 1`. + + Args: + x: Input tensor. + + Returns: + Output tensor of same shape as `x` + where values are clamped between -1 and 1. + + Example: + + >>> x = np.array([-2., -1., 0., 1., 2.]) + >>> x_hard_tanh = keras.ops.hard_tanh(x) + >>> print(x_hard_tanh) + array([-1. -1. 0. 1. 
1.], shape=(5,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return HardTanh().symbolic_call(x) + return backend.nn.hard_tanh(x) + + +class HardShrink(Operation): + def __init__(self, threshold=0.5): + super().__init__() + self.threshold = threshold + + def call(self, x): + return backend.nn.hard_shrink(x, self.threshold) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.hard_shrink", "keras.ops.nn.hard_shrink"]) +def hard_shrink(x, threshold=0.5): + """Hard Shrink activation function. + + The Hard Shrink function is a thresholding operation defined as: + + `f(x) = x` if `|x| > threshold`, + `f(x) = 0` otherwise. + + Args: + x: Input tensor. + threshold: Threshold value. Defaults to 0.5. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-0.5, 0., 1.]) + >>> x_hard_shrink = keras.ops.hard_shrink(x) + >>> print(x_hard_shrink) + array([0. 0. 1.], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return HardShrink(threshold).symbolic_call(x) + return backend.nn.hard_shrink(x, threshold) + + +class Threshold(Operation): + def __init__(self, threshold_value, value): + super().__init__() + self.threshold_value = threshold_value + self.value = value + + def call(self, x): + return backend.nn.threshold(x, self.threshold_value, self.value) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.threshold", "keras.ops.nn.threshold"]) +def threshold(x, threshold, default_value): + """Threshold activation function. + + The function thresholds the input `x` as follows: + `f(x) = x` if `x > threshold`, + `f(x) = default_value` otherwise. + + Args: + x: Input tensor. + threshold: The value that decides when to retain or replace x. + default_value: Value to assign when `x <= threshold`. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = np.array([-1.0, 0.0, 1.0, 2.0]) + >>> x_threshold = keras.ops.threshold(x, 1, 0) + >>> print(x_threshold) + array([0., 0., 0., 2.], shape=(4,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Threshold(threshold, default_value).symbolic_call(x) + return backend.nn.threshold(x, threshold, default_value) + + +class Softmax(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.nn.softmax(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.softmax", "keras.ops.nn.softmax"]) +def softmax(x, axis=-1): + """Softmax activation function. + + The elements of the output vector lie within the range `(0, 1)`, and their + total sum is exactly 1 (excluding the floating point rounding error). + + Each vector is processed independently. The `axis` argument specifies the + axis along which the function is applied within the input. + + It is defined as: + `f(x) = exp(x) / sum(exp(x))` + + Args: + x: Input tensor. + axis: Integer, axis along which the softmax is applied. + + Returns: + A tensor with the same shape as `x`. + + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_softmax = keras.ops.softmax(x) + >>> print(x_softmax) + array([0.09003057, 0.24472847, 0.66524096], shape=(3,), dtype=float64) + + """ + # Don't use `backend.shape` since TensorFlow returns + # symbolic tensors for unknown shape which can trigger + # an error in TensorFlow graph execution. + if isinstance(axis, int) and x.shape[axis] == 1: + warnings.warn( + f"You are using a softmax over axis {axis} " + f"of a tensor of shape {x.shape}. This axis " + "has size 1. The softmax operation will always return " + "the value 1, which is likely not what you intended. " + "Did you mean to use a sigmoid instead?" 
+ ) + if any_symbolic_tensors((x,)): + return Softmax(axis).symbolic_call(x) + if isinstance(axis, tuple): + axis_to_keep = [v for v in range(len(x.shape)) if v not in axis] + + x_transposed = backend.numpy.transpose(x, axes=(*axis_to_keep, *axis)) + x_reshaped = backend.numpy.reshape( + x_transposed, (*[x.shape[v] for v in axis_to_keep], -1) + ) + + x = backend.nn.softmax(x_reshaped, axis=-1) + + x = backend.numpy.reshape(x, x_transposed.shape) + x = backend.numpy.transpose( + x, axes=list(backend.numpy.argsort([*axis_to_keep, *axis])) + ) + return x + else: + return backend.nn.softmax(x, axis=axis) + + +class LogSoftmax(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.nn.log_softmax(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.log_softmax", + "keras.ops.nn.log_softmax", + ] +) +def log_softmax(x, axis=-1): + """Log-softmax activation function. + + It is defined as: + `f(x) = x - max(x) - log(sum(exp(x - max(x))))` + + Args: + x: Input tensor. + axis: Integer, axis along which the log-softmax is applied. + Defaults to `-1`. + + Returns: + A tensor with the same shape as `x`. 
+ + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_log_softmax = keras.ops.log_softmax(x) + >>> print(x_log_softmax) + array([-2.40760596, -1.40760596, -0.40760596], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return LogSoftmax(axis).symbolic_call(x) + if isinstance(axis, tuple): + axis_to_keep = [v for v in range(len(x.shape)) if v not in axis] + + x_transposed = backend.numpy.transpose(x, axes=(*axis_to_keep, *axis)) + x_reshaped = backend.numpy.reshape( + x_transposed, (*[x.shape[v] for v in axis_to_keep], -1) + ) + + x = backend.nn.log_softmax(x_reshaped, axis=-1) + + x = backend.numpy.reshape(x, x_transposed.shape) + x = backend.numpy.transpose( + x, axes=list(backend.numpy.argsort([*axis_to_keep, *axis])) + ) + return x + else: + return backend.nn.log_softmax(x, axis=axis) + + +class Sparsemax(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.nn.sparsemax(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.sparsemax", "keras.ops.nn.sparsemax"]) +def sparsemax(x, axis=-1): + """Sparsemax activation function. + + For each batch `i`, and class `j`, + sparsemax activation function is defined as: + + `sparsemax(x)[i, j] = max(x[i, j] - τ(x[i, :]), 0).` + + Args: + x: Input tensor. + axis: `int`, axis along which the sparsemax operation is applied. + + Returns: + A tensor, output of sparsemax transformation. Has the same type and + shape as `x`. 
+ + Example: + + >>> x = np.array([-1., 0., 1.]) + >>> x_sparsemax = keras.ops.sparsemax(x) + >>> print(x_sparsemax) + array([0., 0., 1.], shape=(3,), dtype=float64) + + """ + if any_symbolic_tensors((x,)): + return Sparsemax(axis).symbolic_call(x) + return backend.nn.sparsemax(x, axis=axis) + + +class MaxPool(Operation): + def __init__( + self, + pool_size, + strides=None, + padding="valid", + data_format=None, + ): + super().__init__() + self.pool_size = pool_size + self.strides = strides + self.padding = padding.lower() + self.data_format = data_format + + def call(self, inputs): + return backend.nn.max_pool( + inputs, + self.pool_size, + self.strides, + self.padding, + self.data_format, + ) + + def compute_output_spec(self, inputs): + output_shape = operation_utils.compute_pooling_output_shape( + inputs.shape, + self.pool_size, + self.strides, + self.padding, + self.data_format, + ) + return KerasTensor(output_shape, dtype=inputs.dtype) + + +@keras_export(["keras.ops.max_pool", "keras.ops.nn.max_pool"]) +def max_pool( + inputs, + pool_size, + strides=None, + padding="valid", + data_format=None, +): + """Max pooling operation. + + Args: + inputs: Tensor of rank N+2. `inputs` has shape + `(batch_size,) + inputs_spatial_shape + (num_channels,)` if + `data_format="channels_last"`, or + `(batch_size, num_channels) + inputs_spatial_shape` if + `data_format="channels_first"`. Pooling happens over the spatial + dimensions only. + pool_size: int or tuple/list of integers of size + `len(inputs_spatial_shape)`, specifying the size of the pooling + window for each spatial dimension of the input tensor. If + `pool_size` is int, then every spatial dimension shares the same + `pool_size`. + strides: int or tuple/list of integers of size + `len(inputs_spatial_shape)`. The stride of the sliding window for + each spatial dimension of the input tensor. If `strides` is int, + then every spatial dimension shares the same `strides`. + padding: string, either `"valid"` or `"same"`. 
`"valid"` means no + padding is applied, and `"same"` results in padding evenly to the + left/right or up/down of the input such that output has the + same height/width dimension as the input when `strides=1`. + data_format: A string, either `"channels_last"` or `"channels_first"`. + `data_format` determines the ordering of the dimensions in the + inputs. If `data_format="channels_last"`, `inputs` is of shape + `(batch_size, ..., channels)` while if + `data_format="channels_first"`, `inputs` is of shape + `(batch_size, channels, ...)`. + + Returns: + A tensor of rank N+2, the result of the max pooling operation. + """ + data_format = standardize_data_format(data_format) + padding = padding.lower() + if any_symbolic_tensors((inputs,)): + return MaxPool( + pool_size, + strides, + padding, + data_format, + ).symbolic_call(inputs) + return backend.nn.max_pool(inputs, pool_size, strides, padding, data_format) + + +class AveragePool(Operation): + def __init__( + self, + pool_size, + strides=None, + padding="valid", + data_format=None, + ): + super().__init__() + self.pool_size = pool_size + self.strides = strides + self.padding = padding.lower() + self.data_format = data_format + + def call(self, inputs): + return backend.nn.average_pool( + inputs, + self.pool_size, + self.strides, + self.padding, + self.data_format, + ) + + def compute_output_spec(self, inputs): + output_shape = operation_utils.compute_pooling_output_shape( + inputs.shape, + self.pool_size, + self.strides, + self.padding, + self.data_format, + ) + return KerasTensor(output_shape, dtype=inputs.dtype) + + +@keras_export( + [ + "keras.ops.average_pool", + "keras.ops.nn.average_pool", + ] +) +def average_pool( + inputs, + pool_size, + strides=None, + padding="valid", + data_format=None, +): + """Average pooling operation. + + Args: + inputs: Tensor of rank N+2. 
`inputs` has shape + `(batch_size,) + inputs_spatial_shape + (num_channels,)` if + `data_format="channels_last"`, or + `(batch_size, num_channels) + inputs_spatial_shape` if + `data_format="channels_first"`. Pooling happens over the spatial + dimensions only. + pool_size: int or tuple/list of integers of size + `len(inputs_spatial_shape)`, specifying the size of the pooling + window for each spatial dimension of the input tensor. If + `pool_size` is int, then every spatial dimension shares the same + `pool_size`. + strides: int or tuple/list of integers of size + `len(inputs_spatial_shape)`. The stride of the sliding window for + each spatial dimension of the input tensor. If `strides` is int, + then every spatial dimension shares the same `strides`. + padding: string, either `"valid"` or `"same"`. `"valid"` means no + padding is applied, and `"same"` results in padding evenly to the + left/right or up/down of the input such that output has the + same height/width dimension as the input when `strides=1`. + data_format: A string, either `"channels_last"` or `"channels_first"`. + `data_format` determines the ordering of the dimensions in the + inputs. If `data_format="channels_last"`, `inputs` is of shape + `(batch_size, ..., channels)` while if + `data_format="channels_first"`, `inputs` is of shape + `(batch_size, channels, ...)`. + + Returns: + A tensor of rank N+2, the result of the average pooling operation. 
+ """ + data_format = standardize_data_format(data_format) + padding = padding.lower() + if any_symbolic_tensors((inputs,)): + return AveragePool( + pool_size, + strides, + padding, + data_format, + ).symbolic_call(inputs) + return backend.nn.average_pool( + inputs, pool_size, strides, padding, data_format + ) + + +class Conv(Operation): + def __init__( + self, + strides=1, + padding="valid", + data_format=None, + dilation_rate=1, + ): + super().__init__() + self.strides = strides + self.padding = padding.lower() + self.data_format = data_format + self.dilation_rate = dilation_rate + + def call(self, inputs, kernel): + return backend.nn.conv( + inputs, + kernel, + strides=self.strides, + padding=self.padding, + data_format=self.data_format, + dilation_rate=self.dilation_rate, + ) + + def compute_output_spec(self, inputs, kernel): + output_shape = operation_utils.compute_conv_output_shape( + inputs.shape, + kernel.shape[-1], + kernel.shape[:-2], + self.strides, + self.padding, + self.data_format, + self.dilation_rate, + ) + return KerasTensor(output_shape, dtype=inputs.dtype) + + +@keras_export(["keras.ops.conv", "keras.ops.nn.conv"]) +def conv( + inputs, + kernel, + strides=1, + padding="valid", + data_format=None, + dilation_rate=1, +): + """General N-D convolution. + + This ops supports 1D, 2D and 3D convolution. + + Args: + inputs: Tensor of rank N+2. `inputs` has shape + `(batch_size,) + inputs_spatial_shape + (num_channels,)` if + `data_format="channels_last"`, or + `(batch_size, num_channels) + inputs_spatial_shape` if + `data_format="channels_first"`. + kernel: Tensor of rank N+2. `kernel` has shape + `(kernel_spatial_shape, num_input_channels, num_output_channels)`. + `num_input_channels` should match the number of channels in + `inputs`. + strides: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the strides of the convolution along each spatial + dimension. If `strides` is int, then every spatial dimension shares + the same `strides`. 
+ padding: string, either `"valid"` or `"same"`. `"valid"` means no + padding is applied, and `"same"` results in padding evenly to the + left/right or up/down of the input such that output has the + same height/width dimension as the input when `strides=1`. + data_format: A string, either `"channels_last"` or `"channels_first"`. + `data_format` determines the ordering of the dimensions in the + inputs. If `data_format="channels_last"`, `inputs` is of shape + `(batch_size, ..., channels)` while if + `data_format="channels_first"`, `inputs` is of shape + `(batch_size, channels, ...)`. + dilation_rate: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the dilation rate to use for dilated convolution. If + `dilation_rate` is int, then every spatial dimension shares + the same `dilation_rate`. + + Returns: + A tensor of rank N+2, the result of the conv operation. + """ + data_format = standardize_data_format(data_format) + padding = padding.lower() + if any_symbolic_tensors((inputs,)): + return Conv(strides, padding, data_format, dilation_rate).symbolic_call( + inputs, kernel + ) + return backend.nn.conv( + inputs, kernel, strides, padding, data_format, dilation_rate + ) + + +class DepthwiseConv(Operation): + def __init__( + self, + strides=1, + padding="valid", + data_format=None, + dilation_rate=1, + ): + super().__init__() + self.strides = strides + self.padding = padding.lower() + self.data_format = data_format + self.dilation_rate = dilation_rate + + def call(self, inputs, kernel): + return backend.nn.depthwise_conv( + inputs, + kernel, + self.strides, + self.padding, + self.data_format, + self.dilation_rate, + ) + + def compute_output_spec(self, inputs, kernel): + output_shape = operation_utils.compute_conv_output_shape( + inputs.shape, + kernel.shape[-1] * kernel.shape[-2], + kernel.shape[:-2], + self.strides, + self.padding, + self.data_format, + self.dilation_rate, + ) + return KerasTensor(output_shape, dtype=inputs.dtype) + + +@keras_export( 
+ [ + "keras.ops.depthwise_conv", + "keras.ops.nn.depthwise_conv", + ] +) +def depthwise_conv( + inputs, + kernel, + strides=1, + padding="valid", + data_format=None, + dilation_rate=1, +): + """General N-D depthwise convolution. + + This ops supports 1D and 2D depthwise convolution. + + Args: + inputs: Tensor of rank N+2. `inputs` has shape + `(batch_size,) + inputs_spatial_shape + (num_channels,)` if + `data_format="channels_last"`, or + `(batch_size, num_channels) + inputs_spatial_shape` if + `data_format="channels_first"`. + kernel: Tensor of rank N+2. `kernel` has shape + [kernel_spatial_shape, num_input_channels, num_channels_multiplier], + `num_input_channels` should match the number of channels in + `inputs`. + strides: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the strides of the convolution along each spatial + dimension. If `strides` is int, then every spatial dimension shares + the same `strides`. + padding: string, either `"valid"` or `"same"`. `"valid"` means no + padding is applied, and `"same"` results in padding evenly to the + left/right or up/down of the input such that output has the + same height/width dimension as the input when `strides=1`. + data_format: A string, either `"channels_last"` or `"channels_first"`. + `data_format` determines the ordering of the dimensions in the + inputs. If `data_format="channels_last"`, `inputs` is of shape + `(batch_size, ..., channels)` while if + `data_format="channels_first"`, `inputs` is of shape + `(batch_size, channels, ...)`. + dilation_rate: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the dilation rate to use for dilated convolution. If + `dilation_rate` is int, then every spatial dimension shares + the same `dilation_rate`. + + Returns: + A tensor of rank N+2, the result of the depthwise conv operation. 
+ """ + data_format = standardize_data_format(data_format) + padding = padding.lower() + if any_symbolic_tensors((inputs,)): + return DepthwiseConv( + strides, padding, data_format, dilation_rate + ).symbolic_call(inputs, kernel) + return backend.nn.depthwise_conv( + inputs, + kernel, + strides, + padding, + data_format, + dilation_rate, + ) + + +class SeparableConv(Operation): + def __init__( + self, + strides=1, + padding="valid", + data_format=None, + dilation_rate=1, + ): + super().__init__() + self.strides = strides + self.padding = padding.lower() + self.data_format = data_format + self.dilation_rate = dilation_rate + + def call(self, inputs, depthwise_kernel, pointwise_kernel): + return backend.nn.separable_conv( + inputs, + depthwise_kernel, + pointwise_kernel, + self.strides, + self.padding, + self.data_format, + self.dilation_rate, + ) + + def compute_output_spec(self, inputs, depthwise_kernel, pointwise_kernel): + output_shape = list( + depthwise_conv( + inputs, + depthwise_kernel, + self.strides, + self.padding, + self.data_format, + self.dilation_rate, + ).shape + ) + if self.data_format == "channels_last": + output_shape[-1] = pointwise_kernel.shape[-1] + else: + output_shape[1] = pointwise_kernel.shape[-1] + return KerasTensor(output_shape, dtype=inputs.dtype) + + +@keras_export( + [ + "keras.ops.separable_conv", + "keras.ops.nn.separable_conv", + ] +) +def separable_conv( + inputs, + depthwise_kernel, + pointwise_kernel, + strides=1, + padding="valid", + data_format=None, + dilation_rate=1, +): + """General N-D separable convolution. + + This ops supports 1D and 2D separable convolution. `separable_conv` is + a depthwise conv followed by a pointwise conv. + + Args: + inputs: Tensor of rank N+2. `inputs` has shape + `(batch_size,) + inputs_spatial_shape + (num_channels,)` if + `data_format="channels_last"`, or + `(batch_size, num_channels) + inputs_spatial_shape` if + `data_format="channels_first"`. + depthwise_kernel: Tensor of rank N+2. 
`depthwise_kernel` has shape + [kernel_spatial_shape, num_input_channels, num_channels_multiplier], + `num_input_channels` should match the number of channels in + `inputs`. + pointwise_kernel: Tensor of rank N+2. `pointwise_kernel` has shape + `(*ones_like(kernel_spatial_shape), + num_input_channels * num_channels_multiplier, num_output_channels)`. + strides: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the strides of the convolution along each spatial + dimension. If `strides` is int, then every spatial dimension shares + the same `strides`. + padding: string, either `"valid"` or `"same"`. `"valid"` means no + padding is applied, and `"same"` results in padding evenly to the + left/right or up/down of the input such that output has the + same height/width dimension as the input when `strides=1`. + data_format: A string, either `"channels_last"` or `"channels_first"`. + `data_format` determines the ordering of the dimensions in the + inputs. If `data_format="channels_last"`, `inputs` is of shape + `(batch_size, ..., channels)` while if + `data_format="channels_first"`, `inputs` is of shape + `(batch_size, channels, ...)`. + dilation_rate: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the dilation rate to use for dilated convolution. If + `dilation_rate` is int, then every spatial dimension shares + the same `dilation_rate`. + + Returns: + A tensor of rank N+2, the result of the depthwise conv operation. 
+ """ + data_format = standardize_data_format(data_format) + padding = padding.lower() + if any_symbolic_tensors((inputs,)): + return SeparableConv( + strides, + padding, + data_format, + dilation_rate, + ).symbolic_call(inputs, depthwise_kernel, pointwise_kernel) + return backend.nn.separable_conv( + inputs, + depthwise_kernel, + pointwise_kernel, + strides, + padding, + data_format, + dilation_rate, + ) + + +class ConvTranspose(Operation): + def __init__( + self, + strides, + padding="valid", + output_padding=None, + data_format=None, + dilation_rate=1, + ): + super().__init__() + self.strides = strides + self.output_padding = output_padding + self.padding = padding.lower() + self.data_format = data_format + self.dilation_rate = dilation_rate + + def call( + self, + inputs, + kernel, + ): + return backend.nn.conv_transpose( + inputs, + kernel, + self.strides, + self.output_padding, + self.padding, + self.data_format, + self.dilation_rate, + ) + + def compute_output_spec(self, inputs, kernel): + kernel_size = kernel.shape[:-2] + filters = kernel.shape[-2] + output_shape = compute_conv_transpose_output_shape( + inputs.shape, + kernel_size, + filters, + self.strides, + self.padding, + self.output_padding, + self.data_format, + self.dilation_rate, + ) + return KerasTensor(output_shape, dtype=inputs.dtype) + + +@keras_export( + [ + "keras.ops.conv_transpose", + "keras.ops.nn.conv_transpose", + ] +) +def conv_transpose( + inputs, + kernel, + strides, + padding="valid", + output_padding=None, + data_format=None, + dilation_rate=1, +): + """General N-D convolution transpose. + + Also known as de-convolution. This ops supports 1D, 2D and 3D convolution. + + Args: + inputs: Tensor of rank N+2. `inputs` has shape + `(batch_size,) + inputs_spatial_shape + (num_channels,)` if + `data_format="channels_last"`, or + `(batch_size, num_channels) + inputs_spatial_shape` if + `data_format="channels_first"`. + kernel: Tensor of rank N+2. 
`kernel` has shape + [kernel_spatial_shape, num_output_channels, num_input_channels], + `num_input_channels` should match the number of channels in + `inputs`. + strides: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the strides of the convolution along each spatial + dimension. If `strides` is int, then every spatial dimension shares + the same `strides`. + padding: string, either `"valid"` or `"same"`. `"valid"` means no + padding is applied, and `"same"` results in padding evenly to the + left/right or up/down of the input such that output has the + same height/width dimension as the input when `strides=1`. + output_padding: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the amount of padding along the height and width of + the output tensor. Can be a single integer to specify the same + value for all spatial dimensions. The amount of output padding + along a given dimension must be lower than the stride along that + same dimension. If set to `None` (default), the output shape is + inferred. + data_format: A string, either `"channels_last"` or `"channels_first"`. + `data_format` determines the ordering of the dimensions in the + inputs. If `data_format="channels_last"`, `inputs` is of shape + `(batch_size, ..., channels)` while if + `data_format="channels_first"`, `inputs` is of shape + `(batch_size, channels, ...)`. + dilation_rate: int or int tuple/list of `len(inputs_spatial_shape)`, + specifying the dilation rate to use for dilated convolution. If + `dilation_rate` is int, then every spatial dimension shares + the same `dilation_rate`. + + Returns: + A tensor of rank N+2, the result of the conv operation. 
+ """ + data_format = standardize_data_format(data_format) + padding = padding.lower() + if any_symbolic_tensors((inputs,)): + return ConvTranspose( + strides, padding, output_padding, data_format, dilation_rate + ).symbolic_call(inputs, kernel) + return backend.nn.conv_transpose( + inputs, + kernel, + strides, + padding, + output_padding, + data_format, + dilation_rate, + ) + + +class OneHot(Operation): + def __init__(self, num_classes, axis=-1, dtype=None, sparse=False): + super().__init__() + self.num_classes = num_classes + self.axis = axis + self.dtype = dtype or backend.floatx() + self.sparse = sparse + + def call(self, x): + return backend.nn.one_hot( + x, + self.num_classes, + axis=self.axis, + dtype=self.dtype, + sparse=self.sparse, + ) + + def compute_output_spec(self, x): + x_shape = list(getattr(x, "shape", [])) + if self.axis == -1: + x_shape.append(self.num_classes) + elif self.axis >= 0 and self.axis < len(x_shape): + x_shape.insert(self.axis, self.num_classes) + else: + raise ValueError( + f"axis must be -1 or between [0, {len(x.shape)}), but " + f"received {self.axis}." + ) + return KerasTensor(x_shape, dtype=self.dtype, sparse=self.sparse) + + +@keras_export(["keras.ops.one_hot", "keras.ops.nn.one_hot"]) +def one_hot(x, num_classes, axis=-1, dtype=None, sparse=False): + """Converts integer tensor `x` into a one-hot tensor. + + The one-hot encoding is a representation where each integer value is + converted into a binary vector with a length equal to `num_classes`, + and the index corresponding to the integer value is marked as 1, while + all other indices are marked as 0. + + Args: + x: Integer tensor to be encoded. The shape can be + arbitrary, but the dtype should be integer. + num_classes: Number of classes for the one-hot encoding. + axis: Axis along which the encoding is performed. + `-1` represents the last axis. Defaults to `-1`. + dtype: (Optional) Data type of the output tensor. 
If not + provided, it defaults to the default data type of the backend. + sparse: Whether to return a sparse tensor; for backends that support + sparse tensors. + + Returns: + Integer tensor: One-hot encoded tensor with the same shape as `x` + except for the specified `axis` dimension, which will have + a length of `num_classes`. The dtype of the output tensor + is determined by `dtype` or the default data type of the backend. + + Example: + + >>> x = keras.ops.convert_to_tensor([1, 3, 2, 0]) + >>> one_hot(x, num_classes=4) + array([[0. 1. 0. 0.] + [0. 0. 0. 1.] + [0. 0. 1. 0.] + [1. 0. 0. 0.]], shape=(4, 4), dtype=float32) + """ + if any_symbolic_tensors((x,)): + return OneHot( + num_classes, axis=axis, dtype=dtype, sparse=sparse + ).symbolic_call(x) + return backend.nn.one_hot( + x, + num_classes, + axis=axis, + dtype=dtype or backend.floatx(), + sparse=sparse, + ) + + +class BinaryCrossentropy(Operation): + def __init__(self, from_logits=False): + super().__init__() + self.from_logits = from_logits + + def call(self, target, output): + return backend.nn.binary_crossentropy( + target, output, from_logits=self.from_logits + ) + + def compute_output_spec(self, target, output): + if target.shape != output.shape: + raise ValueError( + "Arguments `target` and `output` must have the same shape. " + "Received: " + f"target.shape={target.shape}, output.shape={output.shape}" + ) + return KerasTensor(output.shape, dtype=output.dtype) + + +@keras_export( + [ + "keras.ops.binary_crossentropy", + "keras.ops.nn.binary_crossentropy", + ] +) +def binary_crossentropy(target, output, from_logits=False): + """Computes binary cross-entropy loss between target and output tensor. + + The binary cross-entropy loss is commonly used in binary + classification tasks where each input sample belongs to one + of the two classes. It measures the dissimilarity between the + target and output probabilities or logits. + + Args: + target: The target tensor representing the true binary labels. 
+ Its shape should match the shape of the `output` tensor. + output: The output tensor representing the predicted probabilities + or logits. Its shape should match the shape of the + `target` tensor. + from_logits: (optional) Whether `output` is a tensor of logits or + probabilities. + Set it to `True` if `output` represents logits; otherwise, + set it to `False` if `output` represents probabilities. + Defaults to `False`. + + Returns: + Integer tensor: The computed binary cross-entropy loss between + `target` and `output`. + + Example: + + >>> target = keras.ops.convert_to_tensor([0, 1, 1, 0]) + >>> output = keras.ops.convert_to_tensor([0.1, 0.9, 0.8, 0.2]) + >>> binary_crossentropy(target, output) + array([0.10536054 0.10536054 0.22314355 0.22314355], + shape=(4,), dtype=float32) + """ + if any_symbolic_tensors((target, output)): + return BinaryCrossentropy(from_logits=from_logits).symbolic_call( + target, output + ) + return backend.nn.binary_crossentropy( + target, output, from_logits=from_logits + ) + + +class CategoricalCrossentropy(Operation): + def __init__(self, from_logits=False, axis=-1): + super().__init__() + self.from_logits = from_logits + self.axis = axis + + def call(self, target, output): + return backend.nn.categorical_crossentropy( + target, output, from_logits=self.from_logits, axis=self.axis + ) + + def compute_output_spec(self, target, output): + if target.shape != output.shape: + raise ValueError( + "Arguments `target` and `output` must have the same shape. " + "Received: " + f"target.shape={target.shape}, output.shape={output.shape}" + ) + if len(target.shape) < 1: + raise ValueError( + "Arguments `target` and `output` must be at least rank 1. 
" + "Received: " + f"target.shape={target.shape}, output.shape={output.shape}" + ) + return KerasTensor(output.shape[:-1], dtype=output.dtype) + + +@keras_export( + [ + "keras.ops.categorical_crossentropy", + "keras.ops.nn.categorical_crossentropy", + ] +) +def categorical_crossentropy(target, output, from_logits=False, axis=-1): + """Computes categorical cross-entropy loss between target and output tensor. + + The categorical cross-entropy loss is commonly used in multi-class + classification tasks where each input sample can belong to one of + multiple classes. It measures the dissimilarity + between the target and output probabilities or logits. + + Args: + target: The target tensor representing the true categorical labels. + Its shape should match the shape of the `output` tensor + except for the last dimension. + output: The output tensor representing the predicted probabilities + or logits. Its shape should match the shape of the `target` + tensor except for the last dimension. + from_logits: (optional) Whether `output` is a tensor of logits or + probabilities. + Set it to `True` if `output` represents logits; otherwise, + set it to `False` if `output` represents probabilities. + Defaults to `False`. + axis: (optional) The axis along which the categorical cross-entropy + is computed. + Defaults to `-1`, which corresponds to the last dimension of + the tensors. + + Returns: + Integer tensor: The computed categorical cross-entropy loss between + `target` and `output`. + + Example: + + >>> target = keras.ops.convert_to_tensor( + ... [[1, 0, 0], + ... [0, 1, 0], + ... [0, 0, 1]]) + >>> output = keras.ops.convert_to_tensor( + ... [[0.9, 0.05, 0.05], + ... [0.1, 0.8, 0.1], + ... 
[0.2, 0.3, 0.5]]) + >>> categorical_crossentropy(target, output) + array([0.10536054 0.22314355 0.6931472 ], shape=(3,), dtype=float32) + """ + if any_symbolic_tensors((target, output)): + return CategoricalCrossentropy( + from_logits=from_logits, axis=axis + ).symbolic_call(target, output) + return backend.nn.categorical_crossentropy( + target, output, from_logits=from_logits, axis=axis + ) + + +class SparseCategoricalCrossentropy(Operation): + def __init__(self, from_logits=False, axis=-1): + super().__init__() + self.from_logits = from_logits + self.axis = axis + + def call(self, target, output): + return backend.nn.sparse_categorical_crossentropy( + target, output, from_logits=self.from_logits, axis=self.axis + ) + + def compute_output_spec(self, target, output): + if len(output.shape) < 1: + raise ValueError( + "Argument `output` must be at least rank 1. " + "Received: " + f"output.shape={output.shape}" + ) + target_shape = target.shape + if len(target_shape) == len(output.shape) and target_shape[-1] == 1: + target_shape = target_shape[:-1] + if target_shape != output.shape[:-1]: + raise ValueError( + "Arguments `target` and `output` must have the same shape " + "up until the last dimension: " + f"target.shape={target.shape}, output.shape={output.shape}" + ) + return KerasTensor(output.shape[:-1], dtype=output.dtype) + + +@keras_export( + [ + "keras.ops.sparse_categorical_crossentropy", + "keras.ops.nn.sparse_categorical_crossentropy", + ] +) +def sparse_categorical_crossentropy(target, output, from_logits=False, axis=-1): + """Computes sparse categorical cross-entropy loss. + + The sparse categorical cross-entropy loss is similar to categorical + cross-entropy, but it is used when the target tensor contains integer + class labels instead of one-hot encoded vectors. It measures the + dissimilarity between the target and output probabilities or logits. + + Args: + target: The target tensor representing the true class labels as + integers. 
Its shape should match the shape of the `output` + tensor except for the last dimension. + output: The output tensor representing the predicted probabilities + or logits. + Its shape should match the shape of the `target` tensor except + for the last dimension. + from_logits: (optional) Whether `output` is a tensor of logits + or probabilities. + Set it to `True` if `output` represents logits; otherwise, + set it to `False` if `output` represents probabilities. + Defaults to `False`. + axis: (optional) The axis along which the sparse categorical + cross-entropy is computed. + Defaults to `-1`, which corresponds to the last dimension + of the tensors. + + Returns: + Integer tensor: The computed sparse categorical cross-entropy + loss between `target` and `output`. + + Example: + + >>> target = keras.ops.convert_to_tensor([0, 1, 2], dtype=int32) + >>> output = keras.ops.convert_to_tensor( + ... [[0.9, 0.05, 0.05], + ... [0.1, 0.8, 0.1], + ... [0.2, 0.3, 0.5]]) + >>> sparse_categorical_crossentropy(target, output) + array([0.10536056 0.22314355 0.6931472 ], shape=(3,), dtype=float32) + """ + if any_symbolic_tensors((target, output)): + return SparseCategoricalCrossentropy( + from_logits=from_logits, axis=axis + ).symbolic_call(target, output) + return backend.nn.sparse_categorical_crossentropy( + target, output, from_logits=from_logits, axis=axis + ) + + +class MultiHot(Operation): + def __init__( + self, num_classes=None, axis=-1, dtype=None, sparse=False, **kwargs + ): + if num_classes is None and "num_tokens" in kwargs: + num_classes = kwargs.pop("num_tokens") + if num_classes is None: + raise ValueError("Argument `num_classes` must be specified.") + super().__init__(**kwargs) + self.num_classes = num_classes + self.axis = axis + self.dtype = dtype or backend.floatx() + self.sparse = sparse + + def call(self, inputs): + return backend.nn.multi_hot( + inputs, + num_classes=self.num_classes, + axis=self.axis, + dtype=self.dtype, + ) + + def compute_output_spec(self, 
inputs): + x_shape = list(getattr(inputs, "shape", [])) + if self.axis == -1: + x_shape.append(self.num_classes) + elif self.axis >= 0 and self.axis < len(x_shape): + x_shape.insert(self.axis, self.num_classes) + else: + raise ValueError( + f"axis must be -1 or between [0, {len(inputs.shape)}), but " + f"received {self.axis}." + ) + + if len(x_shape) == 2: + x_shape = [x_shape[-1]] + else: + x_shape = [x_shape[0]] + x_shape[2:] + + return KerasTensor(x_shape, dtype=inputs.dtype, sparse=self.sparse) + + +@keras_export( + [ + "keras.ops.multi_hot", + "keras.ops.nn.multi_hot", + ] +) +def multi_hot( + inputs, num_classes=None, axis=-1, dtype=None, sparse=False, **kwargs +): + """Encodes integer labels as multi-hot vectors. + + This function encodes integer labels as multi-hot vectors, where each label + is mapped to a binary value in the resulting vector. + + Args: + inputs: Tensor of integer labels to be converted to multi-hot vectors. + num_classes: Integer, the total number of unique classes. + axis: (optional) Axis along which the multi-hot encoding should be + added. Defaults to `-1`, which corresponds to the last dimension. + dtype: (optional) The data type of the resulting tensor. Default + is backend's float type. + sparse: Whether to return a sparse tensor; for backends that support + sparse tensors. + + Returns: + Tensor: The multi-hot encoded tensor. 
+ + Example: + + >>> data = keras.ops.convert_to_tensor([0, 4]) + >>> keras.ops.multi_hot(data, num_classes=5) + array([1.0, 0.0, 0.0, 0.0, 1.0], dtype=float32) + + """ + if num_classes is None and "num_tokens" in kwargs: + num_classes = kwargs.pop("num_tokens") + if num_classes is None: + raise ValueError("Argument `num_classes` must be specified.") + + if any_symbolic_tensors((inputs,)): + return MultiHot(num_classes, axis, dtype, sparse).symbolic_call(inputs) + + return backend.nn.multi_hot(inputs, num_classes, axis, dtype, sparse) + + +class Moments(Operation): + def __init__(self, axes, keepdims=False, synchronized=False): + super().__init__() + self.axes = axes + self.keepdims = keepdims + self.synchronized = synchronized + + def call(self, x): + return backend.nn.moments( + x, + axes=self.axes, + keepdims=self.keepdims, + synchronized=self.synchronized, + ) + + def compute_output_spec(self, x): + return ( + KerasTensor( + reduce_shape(x.shape, axis=self.axes, keepdims=self.keepdims), + dtype=x.dtype, + ), + KerasTensor( + reduce_shape(x.shape, axis=self.axes, keepdims=self.keepdims), + dtype=x.dtype, + ), + ) + + +@keras_export( + [ + "keras.ops.moments", + "keras.ops.nn.moments", + ] +) +def moments(x, axes, keepdims=False, synchronized=False): + """Calculates the mean and variance of `x`. + + The mean and variance are calculated by aggregating the contents of `x` + across `axes`. If `x` is 1-D and `axes = [0]` this is just the mean and + variance of a vector. + + Args: + x: Input tensor. + axes: A list of axes which to compute mean and variance. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. + synchronized: Only applicable with the TensorFlow backend. + If `True`, synchronizes the global batch statistics (mean and + variance) across all devices at each training step in a + distributed training strategy. If `False`, each replica uses its own + local batch statistics. 
+ + Returns: + A tuple containing two tensors - mean and variance. + + Example: + + >>> x = keras.ops.convert_to_tensor([0, 1, 2, 3, 100], dtype="float32") + >>> keras.ops.moments(x, axes=[0]) + (array(21.2, dtype=float32), array(1553.3601, dtype=float32)) + + """ + if any_symbolic_tensors((x,)): + return Moments(axes, keepdims, synchronized=synchronized).symbolic_call( + x + ) + + return backend.nn.moments(x, axes, keepdims, synchronized=synchronized) + + +class BatchNorm(Operation): + def __init__(self, axis, epsilon): + super().__init__() + self.axis = axis + self.epsilon = epsilon + + def _check_shape(self, name, shape, expected_shape): + if shape != expected_shape: + raise ValueError( + f"Arguments `{name}` must be a vector of length " + f"`x.shape[axis]`. Expected: `{expected_shape}`. " + f"Received: `{shape}." + ) + + def compute_output_spec(self, x, mean, variance, offset, scale): + shape = (x.shape[self.axis],) + self._check_shape("mean", tuple(mean.shape), shape) + self._check_shape("variance", tuple(variance.shape), shape) + if offset is not None: + self._check_shape("offset", tuple(offset.shape), shape) + if offset is not scale: + self._check_shape("scale", tuple(scale.shape), shape) + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.batch_normalization", + "keras.ops.nn.batch_normalization", + ] +) +def batch_normalization( + x, mean, variance, axis, offset=None, scale=None, epsilon=1e-3 +): + """Normalizes `x` by `mean` and `variance`. + + This op is typically used by the batch normalization step in a neural + network. It normalizes the input tensor along the given axis. + + Args: + x: Input tensor. + mean: A mean vector of the same length as the `axis` dimension of the + input thensor. + variance: A variance vector of the same length as the `axis` dimension + of the input tensor. + axis: Integer, the axis that should be normalized. 
+ offset: An offset vector of the same length as the `axis` dimension of + the input tensor. If not `None`, `offset` is added to the normalized + tensor. Defaults to `None`. + scale: A scale vector of the same length as the `axis` dimension of the + input tensor. If not `None`, the normalized tensor is multiplied by + `scale`. Defaults to `None`. + epsilon: Small float added to variance to avoid dividing by zero. + Defaults to 1e-3. + + Returns: + The normalized tensor. + + Example: + + >>> x = keras.ops.convert_to_tensor( + ... [[0.1, 0.2, 0.3], [0.4, 0.5, 0.6], [0.7, 0.8, 0.9]] + ... ) + >>> keras.ops.batch_normalization( + ... x, + ... mean=[0.4, 0.5, 0.6], + ... variance=[0.67, 0.67, 0.67], + ... axis=-1 + ... ) + array([[-3.6624e-01, -3.6624e-01, -3.6624e-01], + [-4.6445e-09, 0.0000e+00, -1.8578e-08], + [ 3.6624e-01, 3.6624e-01, 3.6624e-01]]) + + """ + if any_symbolic_tensors((x, mean, variance, offset, scale)): + return BatchNorm(axis, epsilon).symbolic_call( + x, mean, variance, offset, scale + ) + + return backend.nn.batch_normalization( + x, mean, variance, axis, offset, scale, epsilon + ) + + +class CTCLoss(Operation): + def __init__(self, mask_index=0): + super().__init__() + self.mask_index = mask_index + + def call(self, target, output, target_length, output_length): + return backend.nn.ctc_loss( + target, output, target_length, output_length, self.mask_index + ) + + def _check_shape_first_dim(self, name1, shape1, name2, shape2): + if shape1[0] != shape2[0]: + raise ValueError( + f"Arguments `{name1}` and `{name2}` must have the same " + "first dimension. " + f"Received shapes: `{shape1}` and `{shape2}`." 
+ ) + + def compute_output_spec(self, target, output, target_length, output_length): + self._check_shape_first_dim( + "target", target.shape, "output", output.shape + ) + self._check_shape_first_dim( + "target_length", target_length.shape, "target", target.shape + ) + self._check_shape_first_dim( + "output_length", output_length.shape, "output", output.shape + ) + dtype = backend.result_type(output.dtype, "float32") + return KerasTensor((target.shape[0],), dtype=dtype) + + +@keras_export( + [ + "keras.ops.ctc_loss", + "keras.ops.nn.ctc_loss", + ] +) +def ctc_loss(target, output, target_length, output_length, mask_index=0): + """CTC (Connectionist Temporal Classification) loss. + + Args: + target: A tensor of shape `(batch_size, max_length)` containing + the true labels in integer format. + output: A tensor of shape `(batch_size, max_length, num_classes)` + containing logits (the output of your model). + target_length: A tensor of shape `(batch_size,)` containing the + true label lengths. + output_length: A tensor of shape `(batch_size,)` containing the + output lengths. + mask_index: The index of the mask character in the vocabulary. + Defaults to `0`. 
+ """ + + if any_symbolic_tensors((target, output, target_length, output_length)): + return CTCLoss(mask_index).symbolic_call( + target, output, target_length, output_length + ) + return backend.nn.ctc_loss( + target, output, target_length, output_length, mask_index + ) + + +class CTCDecode(Operation): + def __init__( + self, + strategy="greedy", + beam_width=100, + top_paths=1, + merge_repeated=True, + mask_index=0, + ): + super().__init__() + self.strategy = strategy + self.beam_width = beam_width + self.top_paths = top_paths + self.merge_repeated = merge_repeated + self.mask_index = mask_index + + def call(self, inputs, sequence_lengths): + return backend.nn.ctc_decode( + inputs, + sequence_lengths, + strategy=self.strategy, + beam_width=self.beam_width, + top_paths=self.top_paths, + merge_repeated=self.merge_repeated, + mask_index=self.mask_index, + ) + + def compute_output_spec(self, inputs, sequence_lengths): + inputs_shape = inputs.shape + if self.strategy == "greedy": + top_paths = 1 + else: + top_paths = self.top_paths + dtype = backend.result_type(inputs.dtype, "float32") + return ( + KerasTensor( + (top_paths, inputs_shape[0], inputs_shape[1]), dtype="int32" + ), + KerasTensor((inputs_shape[0], top_paths), dtype=dtype), + ) + + +@keras_export( + [ + "keras.ops.ctc_decode", + "keras.ops.nn.ctc_decode", + ] +) +def ctc_decode( + inputs, + sequence_lengths, + strategy="greedy", + beam_width=100, + top_paths=1, + merge_repeated=True, + mask_index=0, +): + """Decodes the output of a CTC model. + + Args: + inputs: A tensor of shape `(batch_size, max_length, num_classes)` + containing the logits (the output of the model). + They should *not* be normalized via softmax. + sequence_lengths: A tensor of shape `(batch_size,)` containing the + sequence lengths for the batch. + strategy: A string for the decoding strategy. Supported values are + `"greedy"` and `"beam_search"`. + beam_width: An integer scalar beam width used in beam search. + Defaults to 100. 
+ top_paths: An integer scalar, the number of top paths to return. + Defaults to 1. + merge_repeated: A boolean scalar, whether to merge repeated + labels in the output. Defaults to `True`. + mask_index: An integer scalar, the index of the mask character in + the vocabulary. Defaults to `0`. + + Returns: + A tuple containing: + - The tensor representing the list of decoded sequences. If + `strategy="greedy"`, the shape is `(1, batch_size, max_length)`. If + `strategy="beam_search"`, the shape is + `(top_paths, batch_size, max_length)`. Note that: `-1` indicates the + blank label. + - If `strategy="greedy"`, a tensor of shape `(batch_size, 1)` + representing the negative of the sum of the probability logits for + each sequence. If `strategy="beam_seatch"`, a tensor of shape + `(batch_size, top_paths)` representing the log probability for each + sequence. + """ + + if any_symbolic_tensors((inputs, sequence_lengths)): + return CTCDecode( + strategy=strategy, + beam_width=beam_width, + top_paths=top_paths, + merge_repeated=merge_repeated, + mask_index=mask_index, + ).symbolic_call(inputs, sequence_lengths) + return backend.nn.ctc_decode( + inputs=inputs, + sequence_lengths=sequence_lengths, + strategy=strategy, + beam_width=beam_width, + top_paths=top_paths, + merge_repeated=merge_repeated, + mask_index=mask_index, + ) + + +class Normalize(Operation): + def __init__(self, axis=-1, order=2, epsilon=None): + super().__init__() + self.axis = axis + self.order = order + self.epsilon = epsilon + + def compute_output_spec(self, x): + return KerasTensor(shape=x.shape) + + def call(self, x): + return _normalize( + x, axis=self.axis, order=self.order, epsilon=self.epsilon + ) + + +@keras_export( + [ + "keras.ops.normalize", + "keras.ops.nn.normalize", + ] +) +def normalize(x, axis=-1, order=2, epsilon=None): + """Normalizes `x` over the specified axis. + + It is defined as: `normalize(x) = x / max(norm(x), epsilon)`. + + Args: + x: Input tensor. 
+ axis: The axis or axes along which to perform normalization. + Default to -1. + order: The exponent value in the norm formulation. + Defaults to 2. + epsilon: A lower bound value for the norm. + Defaults to `backend.epsilon()`. + + Returns: + The normalized array. + + Example: + + >>> x = keras.ops.convert_to_tensor([[1, 2, 3], [4, 5, 6]]) + >>> x_norm = keras.ops.math.normalize(x) + >>> print(x_norm) + array([[0.26726124 0.5345225 0.8017837 ] + [0.45584232 0.5698029 0.68376344]], shape=(2, 3), dtype=float32) + + """ + if any_symbolic_tensors((x,)): + return Normalize(axis=axis, order=order, epsilon=epsilon).symbolic_call( + x + ) + return _normalize(x, axis=axis, order=order, epsilon=epsilon) + + +def _normalize(x, axis=-1, order=2, epsilon=None): + if not isinstance(order, int) or not order >= 1: + raise ValueError( + f"Argument `order` must be an int >= 1. Received: order={order}" + ) + x = backend.convert_to_tensor(x) + if len(x.shape) == 0: + x = backend.numpy.expand_dims(x, axis=0) + if epsilon is None: + epsilon = backend.epsilon() + if 2 == order: + # A special case: L2 normalization with `x * rsqrt(...)` + # instead of `x / sqrt(...)` + square_sum = backend.numpy.sum( + backend.numpy.square(x), axis=axis, keepdims=True + ) + inv_norm = backend.math.rsqrt(square_sum) + inv_norm = backend.numpy.minimum(inv_norm, 1.0 / epsilon) + return x * inv_norm + norm = backend.linalg.norm(x, ord=order, axis=axis, keepdims=True) + denom = backend.numpy.maximum(norm, epsilon) + return backend.numpy.divide(x, denom) + + +class PSNR(Operation): + def __init__( + self, + max_val, + ): + super().__init__() + self.max_val = max_val + + def call(self, x1, x2): + return backend.nn.psnr( + x1=x1, + x2=x2, + max_val=self.max_val, + ) + + def compute_output_spec(self, x1, x2): + if len(x1.shape) != len(x2.shape): + raise ValueError("Inputs must have the same rank") + + return KerasTensor(shape=()) + + +@keras_export( + [ + "keras.ops.psnr", + "keras.ops.nn.psnr", + ] +) +def 
psnr( + x1, + x2, + max_val, +): + """Peak Signal-to-Noise Ratio (PSNR) function. + + This function computes the Peak Signal-to-Noise Ratio between two signals, + `x1` and `x2`. PSNR is a measure of the quality of a reconstructed signal. + The higher the PSNR, the closer the reconstructed signal is to the original + signal. Note that it can become negative when the signal power is + smaller that the noise power. + + Args: + x1: The first input signal. + x2: The second input signal. Must have the same shape as `x1`. + max_val: The maximum possible value in the signals. + + Returns: + float: The PSNR value between `x1` and `x2`. + + Examples: + + >>> x1 = keras.random.normal((2, 4, 4, 3)) + >>> x2 = keras.random.normal((2, 4, 4, 3)) + >>> max_val = 1.0 + >>> keras.ops.nn.psnr(x1, x2, max_val) + -3.1697404 + """ + if any_symbolic_tensors( + ( + x1, + x2, + ) + ): + return PSNR( + max_val, + ).symbolic_call(x1, x2) + return backend.nn.psnr( + x1, + x2, + max_val, + ) + + +class DotProductAttention(Operation): + def __init__(self, is_causal=False): + super().__init__() + self.is_causal = is_causal + + def call( + self, + query, + key, + value, + bias=None, + mask=None, + scale=None, + flash_attention=None, + ): + return backend.nn.dot_product_attention( + query, + key, + value, + bias=bias, + mask=mask, + scale=scale, + is_causal=self.is_causal, + flash_attention=flash_attention, + ) + + def compute_output_spec( + self, + query, + key, + value, + bias=None, + mask=None, + scale=None, + flash_attention=None, + ): + return KerasTensor(query.shape, dtype=query.dtype) + + +@keras_export( + ["keras.ops.dot_product_attention", "keras.ops.nn.dot_product_attention"] +) +def dot_product_attention( + query, + key, + value, + bias=None, + mask=None, + scale=None, + is_causal=False, + flash_attention=None, +): + """Scaled dot product attention function. 
+ + Computes the attention function on Q (`query`), K (`key`), and V(`value`): + `attention(Q, K, V) = softmax(Q * K / sqrt(d)) * V`. If we define `logits` + as the output of `Q * K` and the `probs` as the output of `softmax`. + + Throughout this function, we utilize the following notation to represent the + shape of array: + - B: batch size + - S: length of the key/value + - T: length of the query + - N: number of attention heads + - H: dimensions of each attention head + - K: number of key/value heads + - G: number of groups, which equals to `N // K` + + Args: + query: The query array with the shape of `(B, T, N, H)`. + key: The key array with the shape of `(B, S, K, H)`. When `K` equals + `N`, multi-headed attention (MHA) is performed. Otherwise, grouped + query attention (GQA) is performed if `N` is a multiple of `K`. and + multi-query attention (MQA) is performed if `K==1` (a special case + of GQA). + value: The value array with the same shape of `key`. + bias: Optional bias array to be added to logits. The shape must be + broadcastable to `(B, N, T, S)`. + mask: Optional mask array used to filter out logits. It is a boolean + mask where `True` indicates the element should take part in + attention. For an additive mask, users should pass it to bias. The + shape must be broadcastable to `(B, N, T, S)`. + scale: Optional scale for the logits. If `None`, the scale will be set + to `1.0 / sqrt(H)`. + is_causal: Whether to apply causal mask. + flash_attention: Whether to use flash attention. If `None`, it will + attempt to use flash attention if the required conditions are met. + Typically, the inputs must be in float16 and bfloat16 dtype and the + input layout requirements may vary depending on the backend. + + Returns: + An array of the attention output with the same shape of `query`. 
+ + Example: + + >>> query = keras.random.normal((2, 4, 8, 16)) + >>> key = keras.random.normal((2, 6, 8, 16)) + >>> value = keras.random.normal((2, 6, 8, 16)) + >>> keras.ops.nn.dot_product_attention(query, key, value).shape + (2, 4, 8, 16) + """ + if any_symbolic_tensors((query, key, value)): + return DotProductAttention(is_causal=is_causal).symbolic_call( + query, + key, + value, + bias=bias, + mask=mask, + scale=scale, + flash_attention=flash_attention, + ) + return backend.nn.dot_product_attention( + query, + key, + value, + bias=bias, + mask=mask, + scale=scale, + is_causal=is_causal, + flash_attention=flash_attention, + ) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/node.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/node.py new file mode 100644 index 0000000000000000000000000000000000000000..7e05de88fcf5c87bbe63cf1682b0fee288e8572b --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/node.py @@ -0,0 +1,143 @@ +import collections + +from keras.src import tree +from keras.src.backend import KerasTensor +from keras.src.ops.symbolic_arguments import SymbolicArguments + + +class Node: + """A `Node` describes an operation `__call__()` event. + + A Keras Function is a DAG with `Node` instances as nodes, and + `KerasTensor` instances as edges. Nodes aren't `Operation` instances, + because a single operation could be called multiple times, which would + result in graph cycles. + + A `__call__()` event involves input tensors (and other input arguments), + the operation that was called, and the resulting output tensors. + A `Node` will include all this information. + + Since a single `Operation` could be called multiple times, + the `Node` instances are stored on operations as a list. + Each time an operation is called, a node is added to `op._inbound_nodes`. 
+ Each time the output of an operation is used by another operation, + a node is added to `op._outbound_nodes`. + + Every `KerasTensor` instance has a `KerasHistory` object attached, + which tracks the `Node` that records the `__call__()` event that created + the tensor. By recursively walking through `Node` instances + via the `KerasHistory` metadata of `KerasTensor` instances, once can + retrieve the entire DAG of a Keras Function. + + Args: + operation: The Operation that was called in the `op.__call__()` + event that this node represents. + call_args: The positional arguments the operation was called with. + call_kwargs: The keyword arguments the operation was called with. + outputs: The output tensors of the `op.__call__()` call. + """ + + def __init__( + self, operation, call_args=None, call_kwargs=None, outputs=None + ): + self.operation = operation + self.arguments = SymbolicArguments(*call_args, **call_kwargs) + self.outputs = [] if outputs is None else tree.flatten(outputs) + for x in self.outputs: + if not isinstance(x, KerasTensor): + raise ValueError( + "All operation outputs must be tensors. " + f"Operation {operation} returned a non-tensor. " + f"Non-tensor received: {x}" + ) + + zero_history = any( + not x.record_history for x in self.arguments.keras_tensors + ) + + # If inputs don't have metadata yet, add it. + if not zero_history: + for tensor in self.arguments.keras_tensors: + if not hasattr(tensor, "_keras_history"): + tensor._keras_history = KerasHistory( + operation=None, node_index=0, tensor_index=0 + ) + + # Wire up Node to Operations. + self.operation._inbound_nodes.append(self) + for kt in self.arguments.keras_tensors: + inbound_op = kt._keras_history.operation + if inbound_op is not None: # It's a graph entry point. + inbound_op._outbound_nodes.append(self) + + # Set metadata on outputs. 
+ if not zero_history: + node_index = len(self.operation._inbound_nodes) - 1 + for i, tensor in enumerate(self.outputs): + tensor._keras_history = KerasHistory( + operation=operation, node_index=node_index, tensor_index=i + ) + + # Whether this is a root node. + self.is_input = not self.arguments.keras_tensors + + def __repr__(self): + return f"" + + @property + def input_tensors(self): + return self.arguments.keras_tensors + + @property + def output_tensors(self): + return self.outputs + + @property + def parent_nodes(self): + """The parent `Node`s. + + Returns: + all the `Node`s whose output this node immediately depends on. + """ + node_deps = [] + for kt in self.arguments.keras_tensors: + op = kt._keras_history.operation + node_index = kt._keras_history.node_index + if op is not None: # `None` for `Input` tensors. + node_deps.append(op._inbound_nodes[node_index]) + return node_deps + + +class KerasHistory( + collections.namedtuple( + "KerasHistory", ["operation", "node_index", "tensor_index"] + ) +): + """Tracks the Operation call that created a Tensor. + + During construction of Keras Functions, this metadata is added to + each Tensor produced as the output of an Operation. + This allows Keras to track how each Tensor was produced, and + this information is later retraced by the `Function` class to + reconstruct the Operations graph. + + Attributes: + operation: The Operation instance that produced the Tensor. + node_index: The specific call to the Operation that produced this Tensor. + Operations can be called multiple times in order to share weights. A new + node is created every time an Operation is called. The corresponding + node that represents the call event that produced the Tensor can be + found at `op._inbound_nodes[node_index]`. + tensor_index: The output index for this Tensor. + Always zero if the Operation that produced this Tensor + only has one output. Nested structures of + Tensors are deterministically assigned an index via `nest.flatten`. 
+ """ + + # Added to maintain memory and performance characteristics of `namedtuple` + # while subclassing. + __slots__ = () + + +def is_keras_tensor(obj): + return hasattr(obj, "_keras_history") diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/numpy.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/numpy.py new file mode 100644 index 0000000000000000000000000000000000000000..cfdcfa7fa681cfe13f741b2ca0231d3d361e8ccc --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/numpy.py @@ -0,0 +1,6888 @@ +import builtins +import re + +import numpy as np + +from keras.src import backend +from keras.src.api_export import keras_export +from keras.src.backend import KerasTensor +from keras.src.backend import any_symbolic_tensors +from keras.src.backend.common import dtypes +from keras.src.backend.common.backend_utils import canonicalize_axis +from keras.src.backend.common.backend_utils import to_tuple_or_list +from keras.src.ops import operation_utils +from keras.src.ops.operation import Operation +from keras.src.ops.operation_utils import broadcast_shapes +from keras.src.ops.operation_utils import reduce_shape + + +def shape_equal(shape1, shape2, axis=None, allow_none=True): + """Check if two shapes are equal. + + Args: + shape1: A list or tuple of integers for first shape to be compared. + shape2: A list or tuple of integers for second shape to be compared. + axis: An integer, list, or tuple of integers (optional): + Axes to ignore during comparison. Defaults to `None`. + allow_none (bool, optional): If `True`, allows `None` in a shape + to match any value in the corresponding position of the other shape. + Defaults to `True`. + + Returns: + bool: `True` if shapes are considered equal based on the criteria, + `False` otherwise. 
+ + Examples: + + >>> shape_equal((32, 64, 128), (32, 64, 128)) + True + >>> shape_equal((32, 64, 128), (32, 64, 127)) + False + >>> shape_equal((32, 64, None), (32, 64, 128), allow_none=True) + True + >>> shape_equal((32, 64, None), (32, 64, 128), allow_none=False) + False + >>> shape_equal((32, 64, 128), (32, 63, 128), axis=1) + True + >>> shape_equal((32, 64, 128), (32, 63, 127), axis=(1, 2)) + True + >>> shape_equal((32, 64, 128), (32, 63, 127), axis=[1,2]) + True + >>> shape_equal((32, 64), (32, 64, 128)) + False + """ + if len(shape1) != len(shape2): + return False + + shape1 = list(shape1) + shape2 = list(shape2) + + if axis is not None: + if isinstance(axis, int): + axis = [axis] + for ax in axis: + shape1[ax] = -1 + shape2[ax] = -1 + + if allow_none: + for i in range(len(shape1)): + if shape1[i] is None: + shape1[i] = shape2[i] + if shape2[i] is None: + shape2[i] = shape1[i] + + return shape1 == shape2 + + +class Absolute(Operation): + def call(self, x): + return backend.numpy.absolute(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.absolute", "keras.ops.numpy.absolute"]) +def absolute(x): + """Compute the absolute value element-wise. + + `keras.ops.abs` is a shorthand for this function. + + Args: + x: Input tensor. + + Returns: + An array containing the absolute value of each element in `x`. 
+ + Example: + + >>> x = keras.ops.convert_to_tensor([-1.2, 1.2]) + >>> keras.ops.absolute(x) + array([1.2, 1.2], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Absolute().symbolic_call(x) + return backend.numpy.absolute(x) + + +class Abs(Absolute): + pass + + +@keras_export(["keras.ops.abs", "keras.ops.numpy.abs"]) +def abs(x): + """Shorthand for `keras.ops.absolute`.""" + return absolute(x) + + +class Add(Operation): + def call(self, x1, x2): + return backend.numpy.add(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and x2_sparse + return KerasTensor( + output_shape, dtype=output_dtype, sparse=output_sparse + ) + + +@keras_export(["keras.ops.add", "keras.ops.numpy.add"]) +def add(x1, x2): + """Add arguments element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + The tensor containing the element-wise sum of `x1` and `x2`. + + Examples: + >>> x1 = keras.ops.convert_to_tensor([1, 4]) + >>> x2 = keras.ops.convert_to_tensor([5, 6]) + >>> keras.ops.add(x1, x2) + array([6, 10], dtype=int32) + + `keras.ops.add` also broadcasts shapes: + >>> x1 = keras.ops.convert_to_tensor( + ... [[5, 4], + ... [5, 6]] + ... 
) + >>> x2 = keras.ops.convert_to_tensor([5, 6]) + >>> keras.ops.add(x1, x2) + array([[10 10] + [10 12]], shape=(2, 2), dtype=int32) + """ + if any_symbolic_tensors((x1, x2)): + return Add().symbolic_call(x1, x2) + return backend.numpy.add(x1, x2) + + +class All(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + self.axis = [axis] + else: + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.all( + x, + axis=self.axis, + keepdims=self.keepdims, + ) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape( + x.shape, + axis=self.axis, + keepdims=self.keepdims, + ), + dtype="bool", + ) + + +@keras_export(["keras.ops.all", "keras.ops.numpy.all"]) +def all(x, axis=None, keepdims=False): + """Test whether all array elements along a given axis evaluate to `True`. + + Args: + x: Input tensor. + axis: An integer or tuple of integers that represent the axis along + which a logical AND reduction is performed. The default + (`axis=None`) is to perform a logical AND over all the dimensions + of the input array. `axis` may be negative, in which case it counts + for the last to the first axis. + keepdims: If `True`, axes which are reduced are left in the result as + dimensions with size one. With this option, the result will + broadcast correctly against the input array. Defaults to `False`. + + Returns: + The tensor containing the logical AND reduction over the `axis`. + + Examples: + >>> x = keras.ops.convert_to_tensor([True, False]) + >>> keras.ops.all(x) + array(False, shape=(), dtype=bool) + + >>> x = keras.ops.convert_to_tensor([[True, False], [True, True]]) + >>> keras.ops.all(x, axis=0) + array([ True False], shape=(2,), dtype=bool) + + `keepdims=True` outputs a tensor with dimensions reduced to one. 
+ >>> x = keras.ops.convert_to_tensor([[True, False], [True, True]]) + >>> keras.ops.all(x, keepdims=True) + array([[False]], shape=(1, 1), dtype=bool) + """ + if any_symbolic_tensors((x,)): + return All(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.all(x, axis=axis, keepdims=keepdims) + + +class Any(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + self.axis = [axis] + else: + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.any( + x, + axis=self.axis, + keepdims=self.keepdims, + ) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape( + x.shape, + axis=self.axis, + keepdims=self.keepdims, + ), + dtype="bool", + ) + + +@keras_export(["keras.ops.any", "keras.ops.numpy.any"]) +def any(x, axis=None, keepdims=False): + """Test whether any array element along a given axis evaluates to `True`. + + Args: + x: Input tensor. + axis: An integer or tuple of integers that represent the axis along + which a logical OR reduction is performed. The default + (`axis=None`) is to perform a logical OR over all the dimensions + of the input array. `axis` may be negative, in which case it counts + for the last to the first axis. + keepdims: If `True`, axes which are reduced are left in the result as + dimensions with size one. With this option, the result will + broadcast correctly against the input array. Defaults to `False`. + + Returns: + The tensor containing the logical OR reduction over the `axis`. + + Examples: + >>> x = keras.ops.convert_to_tensor([True, False]) + >>> keras.ops.any(x) + array(True, shape=(), dtype=bool) + + >>> x = keras.ops.convert_to_tensor([[True, False], [True, True]]) + >>> keras.ops.any(x, axis=0) + array([ True True], shape=(2,), dtype=bool) + + `keepdims=True` outputs a tensor with dimensions reduced to one. 
+ >>> x = keras.ops.convert_to_tensor([[True, False], [True, True]]) + >>> keras.ops.all(x, keepdims=True) + array([[False]], shape=(1, 1), dtype=bool) + """ + if any_symbolic_tensors((x,)): + return Any(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.any(x, axis=axis, keepdims=keepdims) + + +class Amax(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.amax( + x, + axis=self.axis, + keepdims=self.keepdims, + ) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=x.dtype, + ) + + +@keras_export(["keras.ops.amax", "keras.ops.numpy.amax"]) +def amax(x, axis=None, keepdims=False): + """Returns the maximum of an array or maximum value along an axis. + + Args: + x: Input tensor. + axis: Axis along which to compute the maximum. + By default (`axis=None`), find the maximum value in all the + dimensions of the input array. + keepdims: If `True`, axes which are reduced are left in the result as + dimensions that are broadcast to the size of the original + input tensor. Defaults to `False`. + + Returns: + An array with the maximum value. If `axis=None`, the result is a scalar + value representing the maximum element in the entire array. If `axis` is + given, the result is an array with the maximum values along + the specified axis. 
+ + Examples: + >>> x = keras.ops.convert_to_tensor([[1, 3, 5], [2, 3, 6]]) + >>> keras.ops.amax(x) + array(6, dtype=int32) + + >>> x = keras.ops.convert_to_tensor([[1, 6, 8], [1, 5, 2]]) + >>> keras.ops.amax(x, axis=0) + array([1, 6, 8], dtype=int32) + + >>> x = keras.ops.convert_to_tensor([[1, 6, 8], [1, 5, 2]]) + >>> keras.ops.amax(x, axis=1, keepdims=True) + array([[8], [5]], dtype=int32) + """ + if any_symbolic_tensors((x,)): + return Amax(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.amax(x, axis=axis, keepdims=keepdims) + + +class Amin(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.amin(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=x.dtype, + ) + + +@keras_export(["keras.ops.amin", "keras.ops.numpy.amin"]) +def amin(x, axis=None, keepdims=False): + """Returns the minimum of an array or minimum value along an axis. + + Args: + x: Input tensor. + axis: Axis along which to compute the minimum. + By default (`axis=None`), find the minimum value in all the + dimensions of the input array. + keepdims: If `True`, axes which are reduced are left in the result as + dimensions that are broadcast to the size of the original + input tensor. Defaults to `False`. + + Returns: + An array with the minimum value. If `axis=None`, the result is a scalar + value representing the minimum element in the entire array. If `axis` is + given, the result is an array with the minimum values along + the specified axis. 
+ + Examples: + >>> x = keras.ops.convert_to_tensor([1, 3, 5, 2, 3, 6]) + >>> keras.ops.amin(x) + array(1, dtype=int32) + + >>> x = keras.ops.convert_to_tensor([[1, 6, 8], [7, 5, 3]]) + >>> keras.ops.amin(x, axis=0) + array([1,5,3], dtype=int32) + + >>> x = keras.ops.convert_to_tensor([[1, 6, 8], [7, 5, 3]]) + >>> keras.ops.amin(x, axis=1, keepdims=True) + array([[1],[3]], dtype=int32) + """ + if any_symbolic_tensors((x,)): + return Amin(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.amin(x, axis=axis, keepdims=keepdims) + + +class Append(Operation): + def __init__(self, axis=None): + super().__init__() + self.axis = axis + + def call(self, x1, x2): + return backend.numpy.append(x1, x2, axis=self.axis) + + def compute_output_spec(self, x1, x2): + x1_shape = x1.shape + x2_shape = x2.shape + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + if self.axis is None: + if None in x1_shape or None in x2_shape: + output_shape = [None] + else: + output_shape = [int(np.prod(x1_shape) + np.prod(x2_shape))] + return KerasTensor(output_shape, dtype=dtype) + + if not shape_equal(x1_shape, x2_shape, [self.axis]): + raise ValueError( + "`append` requires inputs to have the same shape except the " + f"`axis={self.axis}`, but received shape {x1_shape} and " + f"{x2_shape}." + ) + + output_shape = list(x1_shape) + output_shape[self.axis] = x1_shape[self.axis] + x2_shape[self.axis] + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.append", "keras.ops.numpy.append"]) +def append( + x1, + x2, + axis=None, +): + """Append tensor `x2` to the end of tensor `x1`. + + Args: + x1: First input tensor. + x2: Second input tensor. + axis: Axis along which tensor `x2` is appended to tensor `x1`. + If `None`, both tensors are flattened before use. + + Returns: + A tensor with the values of `x2` appended to `x1`. 
+ + Examples: + >>> x1 = keras.ops.convert_to_tensor([1, 2, 3]) + >>> x2 = keras.ops.convert_to_tensor([[4, 5, 6], [7, 8, 9]]) + >>> keras.ops.append(x1, x2) + array([1, 2, 3, 4, 5, 6, 7, 8, 9], dtype=int32) + + When `axis` is specified, `x1` and `x2` must have compatible shapes. + >>> x1 = keras.ops.convert_to_tensor([[1, 2, 3], [4, 5, 6]]) + >>> x2 = keras.ops.convert_to_tensor([[7, 8, 9]]) + >>> keras.ops.append(x1, x2, axis=0) + array([[1, 2, 3], + [4, 5, 6], + [7, 8, 9]], dtype=int32) + >>> x3 = keras.ops.convert_to_tensor([7, 8, 9]) + >>> keras.ops.append(x1, x3, axis=0) + Traceback (most recent call last): + ... + TypeError: Cannot concatenate arrays with different numbers of + dimensions: got (2, 3), (3,). + """ + if any_symbolic_tensors((x1, x2)): + return Append(axis=axis).symbolic_call(x1, x2) + return backend.numpy.append(x1, x2, axis=axis) + + +class Arange(Operation): + def call(self, start, stop=None, step=1, dtype=None): + return backend.numpy.arange(start, stop, step=step, dtype=dtype) + + def compute_output_spec(self, start, stop=None, step=1, dtype=None): + if stop is None: + start, stop = 0, start + output_shape = [int(np.ceil((stop - start) / step))] + if dtype is None: + dtypes_to_resolve = [ + getattr(start, "dtype", type(start)), + getattr(step, "dtype", type(step)), + ] + if stop is not None: + dtypes_to_resolve.append(getattr(stop, "dtype", type(stop))) + dtype = dtypes.result_type(*dtypes_to_resolve) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.arange", "keras.ops.numpy.arange"]) +def arange(start, stop=None, step=1, dtype=None): + """Return evenly spaced values within a given interval. + + `arange` can be called with a varying number of positional arguments: + * `arange(stop)`: Values are generated within the half-open interval + `[0, stop)` (in other words, the interval including start but excluding + stop). + * `arange(start, stop)`: Values are generated within the half-open interval + `[start, stop)`. 
+ * `arange(start, stop, step)`: Values are generated within the half-open + interval `[start, stop)`, with spacing between values given by step. + + Args: + start: Integer or real, representing the start of the interval. The + interval includes this value. + stop: Integer or real, representing the end of the interval. The + interval does not include this value, except in some cases where + `step` is not an integer and floating point round-off affects the + length of `out`. Defaults to `None`. + step: Integer or real, represent the spacing between values. For any + output `out`, this is the distance between two adjacent values, + `out[i+1] - out[i]`. The default step size is 1. If `step` is + specified as a position argument, `start` must also be given. + dtype: The type of the output array. If `dtype` is not given, infer the + data type from the other input arguments. + + Returns: + Tensor of evenly spaced values. + For floating point arguments, the length of the result is + `ceil((stop - start)/step)`. Because of floating point overflow, this + rule may result in the last element of out being greater than stop. + + Examples: + >>> keras.ops.arange(3) + array([0, 1, 2], dtype=int32) + + >>> keras.ops.arange(3.0) + array([0., 1., 2.], dtype=float32) + + >>> keras.ops.arange(3, 7) + array([3, 4, 5, 6], dtype=int32) + + >>> keras.ops.arange(3, 7, 2) + array([3, 5], dtype=int32) + """ + return backend.numpy.arange(start, stop, step=step, dtype=dtype) + + +class Arccos(Operation): + def call(self, x): + return backend.numpy.arccos(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.arccos", "keras.ops.numpy.arccos"]) +def arccos(x): + """Trigonometric inverse cosine, element-wise. 
+ + The inverse of `cos` so that, if `y = cos(x)`, then `x = arccos(y)`. + + Args: + x: Input tensor. + + Returns: + Tensor of the angle of the ray intersecting the unit circle at the given + x-coordinate in radians `[0, pi]`. + + Example: + >>> x = keras.ops.convert_to_tensor([1, -1]) + >>> keras.ops.arccos(x) + array([0.0, 3.1415927], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Arccos().symbolic_call(x) + return backend.numpy.arccos(x) + + +class Arccosh(Operation): + def call(self, x): + return backend.numpy.arccosh(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.arccosh", "keras.ops.numpy.arccosh"]) +def arccosh(x): + """Inverse hyperbolic cosine, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as x. + + Example: + >>> x = keras.ops.convert_to_tensor([10, 100]) + >>> keras.ops.arccosh(x) + array([2.993223, 5.298292], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Arccosh().symbolic_call(x) + return backend.numpy.arccosh(x) + + +class Arcsin(Operation): + def call(self, x): + return backend.numpy.arcsin(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.arcsin", "keras.ops.numpy.arcsin"]) +def arcsin(x): + """Inverse sine, element-wise. + + Args: + x: Input tensor. + + Returns: + Tensor of the inverse sine of each element in `x`, in radians and in + the closed interval `[-pi/2, pi/2]`. 
+ + Example: + >>> x = keras.ops.convert_to_tensor([1, -1, 0]) + >>> keras.ops.arcsin(x) + array([ 1.5707964, -1.5707964, 0.], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Arcsin().symbolic_call(x) + return backend.numpy.arcsin(x) + + +class Arcsinh(Operation): + def call(self, x): + return backend.numpy.arcsinh(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.arcsinh", "keras.ops.numpy.arcsinh"]) +def arcsinh(x): + """Inverse hyperbolic sine, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. + + Example: + >>> x = keras.ops.convert_to_tensor([1, -1, 0]) + >>> keras.ops.arcsinh(x) + array([0.88137364, -0.88137364, 0.0], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Arcsinh().symbolic_call(x) + return backend.numpy.arcsinh(x) + + +class Arctan(Operation): + def call(self, x): + return backend.numpy.arctan(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.arctan", "keras.ops.numpy.arctan"]) +def arctan(x): + """Trigonometric inverse tangent, element-wise. + + Args: + x: Input tensor. + + Returns: + Tensor of the inverse tangent of each element in `x`, in the interval + `[-pi/2, pi/2]`. 
+ + Example: + >>> x = keras.ops.convert_to_tensor([0, 1]) + >>> keras.ops.arctan(x) + array([0., 0.7853982], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Arctan().symbolic_call(x) + return backend.numpy.arctan(x) + + +class Arctan2(Operation): + def call(self, x1, x2): + return backend.numpy.arctan2(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + outputs_shape = broadcast_shapes(x1_shape, x2_shape) + x1_dtype = backend.standardize_dtype( + getattr(x1, "dtype", backend.floatx()) + ) + x2_dtype = backend.standardize_dtype( + getattr(x2, "dtype", backend.floatx()) + ) + dtype = dtypes.result_type(x1_dtype, x2_dtype, float) + return KerasTensor(outputs_shape, dtype=dtype) + + +@keras_export(["keras.ops.arctan2", "keras.ops.numpy.arctan2"]) +def arctan2(x1, x2): + """Element-wise arc tangent of `x1/x2` choosing the quadrant correctly. + + The quadrant (i.e., branch) is chosen so that `arctan2(x1, x2)` is the + signed angle in radians between the ray ending at the origin and passing + through the point `(1, 0)`, and the ray ending at the origin and passing + through the point `(x2, x1)`. (Note the role reversal: the "y-coordinate" + is the first function parameter, the "x-coordinate" is the second.) By IEEE + convention, this function is defined for `x2 = +/-0` and for either or both + of `x1` and `x2` `= +/-inf`. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Tensor of angles in radians, in the range `[-pi, pi]`. + + Examples: + Consider four points in different quadrants: + >>> x = keras.ops.convert_to_tensor([-1, +1, +1, -1]) + >>> y = keras.ops.convert_to_tensor([-1, -1, +1, +1]) + >>> keras.ops.arctan2(y, x) * 180 / numpy.pi + array([-135., -45., 45., 135.], dtype=float32) + + Note the order of the parameters. 
`arctan2` is defined also when x2=0 and + at several other points, obtaining values in the range `[-pi, pi]`: + >>> keras.ops.arctan2( + ... keras.ops.array([1., -1.]), + ... keras.ops.array([0., 0.]), + ... ) + array([ 1.5707964, -1.5707964], dtype=float32) + >>> keras.ops.arctan2( + ... keras.ops.array([0., 0., numpy.inf]), + ... keras.ops.array([+0., -0., numpy.inf]), + ... ) + array([0., 3.1415925, 0.7853982], dtype=float32) + """ + if any_symbolic_tensors((x1, x2)): + return Arctan2().symbolic_call(x1, x2) + return backend.numpy.arctan2(x1, x2) + + +class Arctanh(Operation): + def call(self, x): + return backend.numpy.arctanh(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.arctanh", "keras.ops.numpy.arctanh"]) +def arctanh(x): + """Inverse hyperbolic tangent, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. + """ + if any_symbolic_tensors((x,)): + return Arctanh().symbolic_call(x) + return backend.numpy.arctanh(x) + + +class Argmax(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.argmax(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + if self.keepdims: + return KerasTensor(x.shape, dtype="int32") + if self.axis is None: + return KerasTensor([], dtype="int32") + return KerasTensor( + reduce_shape(x.shape, axis=[self.axis]), dtype="int32" + ) + + +@keras_export(["keras.ops.argmax", "keras.ops.numpy.argmax"]) +def argmax(x, axis=None, keepdims=False): + """Returns the indices of the maximum values along an axis. + + Args: + x: Input tensor. 
+ axis: By default, the index is into the flattened tensor, otherwise + along the specified axis. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. Defaults to `False`. + + Returns: + Tensor of indices. It has the same shape as `x`, with the dimension + along `axis` removed. + + Example: + >>> x = keras.ops.arange(6).reshape(2, 3) + 10 + >>> x + array([[10, 11, 12], + [13, 14, 15]], dtype=int32) + >>> keras.ops.argmax(x) + array(5, dtype=int32) + >>> keras.ops.argmax(x, axis=0) + array([1, 1, 1], dtype=int32) + >>> keras.ops.argmax(x, axis=1) + array([2, 2], dtype=int32) + """ + if any_symbolic_tensors((x,)): + return Argmax(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.argmax(x, axis=axis, keepdims=keepdims) + + +class Argmin(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.argmin(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + if self.keepdims: + return KerasTensor(x.shape, dtype="int32") + if self.axis is None: + return KerasTensor([], dtype="int32") + return KerasTensor( + reduce_shape(x.shape, axis=[self.axis]), dtype="int32" + ) + + +@keras_export(["keras.ops.argmin", "keras.ops.numpy.argmin"]) +def argmin(x, axis=None, keepdims=False): + """Returns the indices of the minimum values along an axis. + + Args: + x: Input tensor. + axis: By default, the index is into the flattened tensor, otherwise + along the specified axis. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. Defaults to `False`. + + Returns: + Tensor of indices. It has the same shape as `x`, with the dimension + along `axis` removed. 
+ + Example: + >>> x = keras.ops.arange(6).reshape(2, 3) + 10 + >>> x + array([[10, 11, 12], + [13, 14, 15]], dtype=int32) + >>> keras.ops.argmin(x) + array(0, dtype=int32) + >>> keras.ops.argmin(x, axis=0) + array([0, 0, 0], dtype=int32) + >>> keras.ops.argmin(x, axis=1) + array([0, 0], dtype=int32) + """ + if any_symbolic_tensors((x,)): + return Argmin(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.argmin(x, axis=axis, keepdims=keepdims) + + +class Argsort(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.numpy.argsort(x, axis=self.axis) + + def compute_output_spec(self, x): + if self.axis is None: + return KerasTensor([int(np.prod(x.shape))], dtype="int32") + return KerasTensor(x.shape, dtype="int32") + + +@keras_export(["keras.ops.argsort", "keras.ops.numpy.argsort"]) +def argsort(x, axis=-1): + """Returns the indices that would sort a tensor. + + Args: + x: Input tensor. + axis: Axis along which to sort. Defaults to `-1` (the last axis). If + `None`, the flattened tensor is used. + + Returns: + Tensor of indices that sort `x` along the specified `axis`. 
+ + Examples: + One dimensional array: + >>> x = keras.ops.array([3, 1, 2]) + >>> keras.ops.argsort(x) + array([1, 2, 0], dtype=int32) + + Two-dimensional array: + >>> x = keras.ops.array([[0, 3], [3, 2], [4, 5]]) + >>> x + array([[0, 3], + [3, 2], + [4, 5]], dtype=int32) + >>> keras.ops.argsort(x, axis=0) + array([[0, 1], + [1, 0], + [2, 2]], dtype=int32) + >>> keras.ops.argsort(x, axis=1) + array([[0, 1], + [1, 0], + [0, 1]], dtype=int32) + """ + if any_symbolic_tensors((x,)): + return Argsort(axis=axis).symbolic_call(x) + return backend.numpy.argsort(x, axis=axis) + + +class Array(Operation): + def call(self, x, dtype=None): + return backend.numpy.array(x, dtype=dtype) + + def compute_output_spec(self, x, dtype=None): + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.array", "keras.ops.numpy.array"]) +def array(x, dtype=None): + """Create a tensor. + + Args: + x: Input tensor. + dtype: The desired data-type for the tensor. + + Returns: + A tensor. + + Examples: + >>> keras.ops.array([1, 2, 3]) + array([1, 2, 3], dtype=int32) + + >>> keras.ops.array([1, 2, 3], dtype="float32") + array([1., 2., 3.], dtype=float32) + """ + if any_symbolic_tensors((x,)): + return Array().symbolic_call(x, dtype=dtype) + return backend.numpy.array(x, dtype=dtype) + + +class Average(Operation): + def __init__(self, axis=None): + super().__init__() + # np.average() does not support axis as tuple as declared by the + # docstring, it only supports int or None. 
+ self.axis = axis + + def call(self, x, weights=None): + return backend.numpy.average(x, weights=weights, axis=self.axis) + + def compute_output_spec(self, x, weights=None): + dtypes_to_resolve = [getattr(x, "dtype", type(x)), float] + if weights is not None: + shape_match = shape_equal(x.shape, weights.shape, allow_none=True) + if self.axis is not None: + shape_match_on_axis = shape_equal( + [x.shape[self.axis]], weights.shape, allow_none=True + ) + dtypes_to_resolve.append(getattr(weights, "dtype", type(weights))) + dtype = dtypes.result_type(*dtypes_to_resolve) + if self.axis is None: + if weights is None or shape_match: + return KerasTensor([], dtype=dtype) + else: + raise ValueError( + "`weights` must have the same shape as `x` when " + f"`axis=None`, but received `weights.shape={weights.shape}`" + f" and `x.shape={x.shape}`." + ) + + if weights is None or shape_match_on_axis or shape_match: + return KerasTensor( + reduce_shape(x.shape, axis=[self.axis]), dtype=dtype + ) + else: + # `weights` can either be a 1D array of length `x.shape[axis]` or + # of the same shape as `x`. + raise ValueError( + "`weights` must have the same size as `x` at " + f"`axis={self.axis}` but received " + f"`weights.shape={weights.shape}` while x.shape at " + f"`{self.axis}` is `{x.shape[self.axis]}`." + ) + + +@keras_export(["keras.ops.average", "keras.ops.numpy.average"]) +def average(x, axis=None, weights=None): + """Compute the weighted average along the specified axis. + + Args: + x: Input tensor. + axis: Integer along which to average `x`. The default, `axis=None`, + will average over all of the elements of the input tensor. If axis + is negative it counts from the last to the first axis. + weights: Tensor of weights associated with the values in `x`. Each + value in `x` contributes to the average according to its + associated weight. The weights array can either be 1-D (in which + case its length must be the size of a along the given axis) or of + the same shape as `x`. 
If `weights=None` (default), then all data + in `x` are assumed to have a weight equal to one. + + The 1-D calculation is: `avg = sum(a * weights) / sum(weights)`. + The only constraint on weights is that `sum(weights)` must not be 0. + + Returns: + Return the average along the specified axis. + + Examples: + >>> data = keras.ops.arange(1, 5) + >>> data + array([1, 2, 3, 4], dtype=int32) + >>> keras.ops.average(data) + array(2.5, dtype=float32) + >>> keras.ops.average( + ... keras.ops.arange(1, 11), + ... weights=keras.ops.arange(10, 0, -1) + ... ) + array(4., dtype=float32) + + >>> data = keras.ops.arange(6).reshape((3, 2)) + >>> data + array([[0, 1], + [2, 3], + [4, 5]], dtype=int32) + >>> keras.ops.average( + ... data, + ... axis=1, + ... weights=keras.ops.array([1./4, 3./4]) + ... ) + array([0.75, 2.75, 4.75], dtype=float32) + >>> keras.ops.average( + ... data, + ... weights=keras.ops.array([1./4, 3./4]) + ... ) + Traceback (most recent call last): + ... + ValueError: Axis must be specified when shapes of a and weights differ. 
+ """ + if any_symbolic_tensors((x,)): + return Average(axis=axis).symbolic_call(x, weights=weights) + return backend.numpy.average(x, weights=weights, axis=axis) + + +class Bincount(Operation): + def __init__(self, weights=None, minlength=0, sparse=False): + super().__init__() + self.weights = weights + self.minlength = minlength + self.sparse = sparse + + def call(self, x): + return backend.numpy.bincount( + x, + weights=self.weights, + minlength=self.minlength, + sparse=self.sparse, + ) + + def compute_output_spec(self, x): + dtypes_to_resolve = [x.dtype] + if self.weights is not None: + weights = backend.convert_to_tensor(self.weights) + dtypes_to_resolve.append(weights.dtype) + dtype = dtypes.result_type(*dtypes_to_resolve) + else: + dtype = "int32" + x_sparse = getattr(x, "sparse", False) + return KerasTensor( + list(x.shape[:-1]) + [None], + dtype=dtype, + sparse=x_sparse or self.sparse, + ) + + +@keras_export(["keras.ops.bincount", "keras.ops.numpy.bincount"]) +def bincount(x, weights=None, minlength=0, sparse=False): + """Count the number of occurrences of each value in a tensor of integers. + + Args: + x: Input tensor. + It must be of dimension 1, and it must only contain non-negative + integer(s). + weights: Weight tensor. + It must have the same length as `x`. The default value is `None`. + If specified, `x` is weighted by it, i.e. if `n = x[i]`, + `out[n] += weight[i]` instead of the default behavior `out[n] += 1`. + minlength: An integer. + The default value is 0. If specified, there will be at least + this number of bins in the output tensor. If greater than + `max(x) + 1`, each value of the output at an index higher than + `max(x)` is set to 0. + sparse: Whether to return a sparse tensor; for backends that support + sparse tensors. + + Returns: + 1D tensor where each element gives the number of occurrence(s) of its + index value in x. Its length is the maximum between `max(x) + 1` and + minlength. 
+ + Examples: + >>> x = keras.ops.array([1, 2, 2, 3], dtype="uint8") + >>> keras.ops.bincount(x) + array([0, 1, 2, 1], dtype=int32) + >>> weights = x / 2 + >>> weights + array([0.5, 1., 1., 1.5], dtype=float64) + >>> keras.ops.bincount(x, weights=weights) + array([0., 0.5, 2., 1.5], dtype=float64) + >>> minlength = (keras.ops.max(x).numpy() + 1) + 2 # 6 + >>> keras.ops.bincount(x, minlength=minlength) + array([0, 1, 2, 1, 0, 0], dtype=int32) + """ + if any_symbolic_tensors((x,)): + return Bincount( + weights=weights, minlength=minlength, sparse=sparse + ).symbolic_call(x) + return backend.numpy.bincount( + x, weights=weights, minlength=minlength, sparse=sparse + ) + + +class BitwiseAnd(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.bitwise_and(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.bitwise_and", "keras.ops.numpy.bitwise_and"]) +def bitwise_and(x, y): + """Compute the bit-wise AND of two arrays element-wise. + + Computes the bit-wise AND of the underlying binary representation of the + integers in the input arrays. This ufunc implements the C/Python operator + `&`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. + """ + if any_symbolic_tensors((x, y)): + return BitwiseAnd().symbolic_call(x, y) + return backend.numpy.bitwise_and(x, y) + + +class BitwiseInvert(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.numpy.bitwise_invert(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.bitwise_invert", "keras.ops.numpy.bitwise_invert"]) +def bitwise_invert(x): + """Compute bit-wise inversion, or bit-wise NOT, element-wise. + + Computes the bit-wise NOT of the underlying binary representation of the + integers in the input arrays. 
This ufunc implements the C/Python operator + `~`. + + Args: + x: Input integer tensor. + + Returns: + Result tensor. + """ + if any_symbolic_tensors((x,)): + return BitwiseInvert().symbolic_call(x) + return backend.numpy.bitwise_invert(x) + + +class BitwiseNot(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.numpy.bitwise_not(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.bitwise_not", "keras.ops.numpy.bitwise_not"]) +def bitwise_not(x): + """Compute bit-wise inversion, or bit-wise NOT, element-wise. + + Computes the bit-wise NOT of the underlying binary representation of the + integers in the input arrays. This ufunc implements the C/Python operator + `~`. + + Args: + x: Input integer tensor. + + Returns: + Result tensor. + """ + if any_symbolic_tensors((x,)): + return BitwiseNot().symbolic_call(x) + return backend.numpy.bitwise_not(x) + + +class BitwiseOr(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.bitwise_or(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.bitwise_or", "keras.ops.numpy.bitwise_or"]) +def bitwise_or(x, y): + """Compute the bit-wise OR of two arrays element-wise. + + Computes the bit-wise OR of the underlying binary representation of the + integers in the input arrays. This ufunc implements the C/Python operator + `|`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. 
+ """ + if any_symbolic_tensors((x, y)): + return BitwiseOr().symbolic_call(x, y) + return backend.numpy.bitwise_or(x, y) + + +class BitwiseXor(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.bitwise_xor(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.bitwise_xor", "keras.ops.numpy.bitwise_xor"]) +def bitwise_xor(x, y): + """Compute the bit-wise XOR of two arrays element-wise. + + Computes the bit-wise XOR of the underlying binary representation of the + integers in the input arrays. This ufunc implements the C/Python operator + `^`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. + """ + if any_symbolic_tensors((x, y)): + return BitwiseXor().symbolic_call(x, y) + return backend.numpy.bitwise_xor(x, y) + + +class BitwiseLeftShift(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.bitwise_left_shift(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export( + ["keras.ops.bitwise_left_shift", "keras.ops.numpy.bitwise_left_shift"] +) +def bitwise_left_shift(x, y): + """Shift the bits of an integer to the left. + + Bits are shifted to the left by appending `y` 0s at the right of `x`. + Since the internal representation of numbers is in binary format, this + operation is equivalent to multiplying `x` by `2**y`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. 
+ """ + if any_symbolic_tensors((x, y)): + return BitwiseLeftShift().symbolic_call(x, y) + return backend.numpy.bitwise_left_shift(x, y) + + +class LeftShift(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.left_shift(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.left_shift", "keras.ops.numpy.left_shift"]) +def left_shift(x, y): + """Shift the bits of an integer to the left. + + Bits are shifted to the left by appending `y` 0s at the right of `x`. + Since the internal representation of numbers is in binary format, this + operation is equivalent to multiplying `x` by `2**y`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. + """ + if any_symbolic_tensors((x, y)): + return LeftShift().symbolic_call(x, y) + return backend.numpy.left_shift(x, y) + + +class BitwiseRightShift(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.bitwise_right_shift(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export( + ["keras.ops.bitwise_right_shift", "keras.ops.numpy.bitwise_right_shift"] +) +def bitwise_right_shift(x, y): + """Shift the bits of an integer to the right. + + Bits are shifted to the right `y`. Because the internal representation of + numbers is in binary format, this operation is equivalent to dividing `x` by + `2**y`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. 
+ """ + if any_symbolic_tensors((x, y)): + return BitwiseRightShift().symbolic_call(x, y) + return backend.numpy.bitwise_right_shift(x, y) + + +class RightShift(Operation): + def __init__(self): + super().__init__() + + def call(self, x, y): + return backend.numpy.right_shift(x, y) + + def compute_output_spec(self, x, y): + dtype = dtypes.result_type(x.dtype, y.dtype) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.right_shift", "keras.ops.numpy.right_shift"]) +def right_shift(x, y): + """Shift the bits of an integer to the right. + + Bits are shifted to the right `y`. Because the internal representation of + numbers is in binary format, this operation is equivalent to dividing `x` by + `2**y`. + + Args: + x: Input integer tensor. + y: Input integer tensor. + + Returns: + Result tensor. + """ + if any_symbolic_tensors((x, y)): + return RightShift().symbolic_call(x, y) + return backend.numpy.right_shift(x, y) + + +class BroadcastTo(Operation): + def __init__(self, shape): + super().__init__() + self.shape = shape + + def call(self, x): + return backend.numpy.broadcast_to(x, self.shape) + + def compute_output_spec(self, x): + # Catch broadcasting errors for clear error messages. + broadcast_shapes(x.shape, self.shape) + return KerasTensor(self.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.broadcast_to", + "keras.ops.numpy.broadcast_to", + ] +) +def broadcast_to(x, shape): + """Broadcast a tensor to a new shape. + + Args: + x: The tensor to broadcast. + shape: The shape of the desired tensor. A single integer `i` is + interpreted as `(i,)`. + + Returns: + A tensor with the desired shape. 
+ + Examples: + >>> x = keras.ops.array([1, 2, 3]) + >>> keras.ops.broadcast_to(x, (3, 3)) + array([[1, 2, 3], + [1, 2, 3], + [1, 2, 3]]) + """ + if any_symbolic_tensors((x,)): + return BroadcastTo(shape=shape).symbolic_call(x) + return backend.numpy.broadcast_to(x, shape) + + +class Ceil(Operation): + def call(self, x): + return backend.numpy.ceil(x) + + def compute_output_spec(self, x): + if backend.standardize_dtype(x.dtype) == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(x.dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.ceil", "keras.ops.numpy.ceil"]) +def ceil(x): + """Return the ceiling of the input, element-wise. + + The ceil of the scalar `x` is the smallest integer `i`, such that + `i >= x`. + + Args: + x: Input tensor. + + Returns: + The ceiling of each element in `x`, with float dtype. + """ + if any_symbolic_tensors((x,)): + return Ceil().symbolic_call(x) + return backend.numpy.ceil(x) + + +class Clip(Operation): + def __init__(self, x_min, x_max): + super().__init__() + self.x_min = x_min + self.x_max = x_max + + def call(self, x): + return backend.numpy.clip(x, self.x_min, self.x_max) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(x.dtype) + if dtype == "bool": + dtype = "int32" + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.clip", "keras.ops.numpy.clip"]) +def clip(x, x_min, x_max): + """Clip (limit) the values in a tensor. + + Given an interval, values outside the interval are clipped to the + interval edges. For example, if an interval of `[0, 1]` is specified, + values smaller than 0 become 0, and values larger than 1 become 1. + + Args: + x: Input tensor. + x_min: Minimum value. + x_max: Maximum value. + Returns: + The clipped tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Clip(x_min, x_max).symbolic_call(x) + return backend.numpy.clip(x, x_min, x_max) + + +class Concatenate(Operation): + def __init__(self, axis=0): + super().__init__() + if axis is None: + raise ValueError("`axis` cannot be None for `concatenate`.") + self.axis = axis + + def call(self, xs): + return backend.numpy.concatenate(xs, axis=self.axis) + + def compute_output_spec(self, xs): + first_shape = xs[0].shape + total_size_on_axis = 0 + all_sparse = True + dtypes_to_resolve = [] + for x in xs: + if not shape_equal( + x.shape, first_shape, axis=[self.axis], allow_none=True + ): + raise ValueError( + "Every value in `xs` must have the same shape except on " + f"the `axis` dim. But found element of shape {x.shape}, " + f"which is different from the first element's " + f"shape {first_shape}." + ) + if total_size_on_axis is None or x.shape[self.axis] is None: + total_size_on_axis = None + else: + total_size_on_axis += x.shape[self.axis] + all_sparse = all_sparse and getattr(x, "sparse", False) + dtypes_to_resolve.append(getattr(x, "dtype", type(x))) + output_shape = list(first_shape) + output_shape[self.axis] = total_size_on_axis + dtype = dtypes.result_type(*dtypes_to_resolve) + return KerasTensor(output_shape, dtype=dtype, sparse=all_sparse) + + +@keras_export( + [ + "keras.ops.concatenate", + "keras.ops.numpy.concatenate", + ] +) +def concatenate(xs, axis=0): + """Join a sequence of tensors along an existing axis. + + Args: + xs: The sequence of tensors to concatenate. + axis: The axis along which the tensors will be joined. Defaults to `0`. + + Returns: + The concatenated tensor. 
+ """ + if any_symbolic_tensors(xs): + return Concatenate(axis=axis).symbolic_call(xs) + return backend.numpy.concatenate(xs, axis=axis) + + +class Conjugate(Operation): + def call(self, x): + return backend.numpy.conjugate(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.conjugate", "keras.ops.numpy.conjugate"]) +def conjugate(x): + """Returns the complex conjugate, element-wise. + + The complex conjugate of a complex number is obtained by changing the sign + of its imaginary part. + + `keras.ops.conj` is a shorthand for this function. + + Args: + x: Input tensor. + + Returns: + The complex conjugate of each element in `x`. + """ + if any_symbolic_tensors((x,)): + return Conjugate().symbolic_call(x) + return backend.numpy.conjugate(x) + + +class Conj(Conjugate): + pass + + +@keras_export(["keras.ops.conj", "keras.ops.numpy.conj"]) +def conj(x): + """Shorthand for `keras.ops.conjugate`.""" + return conjugate(x) + + +class Copy(Operation): + def call(self, x): + return backend.numpy.copy(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.copy", "keras.ops.numpy.copy"]) +def copy(x): + """Returns a copy of `x`. + + Args: + x: Input tensor. + + Returns: + A copy of `x`. + """ + if any_symbolic_tensors((x,)): + return Copy().symbolic_call(x) + return backend.numpy.copy(x) + + +class Cos(Operation): + def call(self, x): + return backend.numpy.cos(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.cos", "keras.ops.numpy.cos"]) +def cos(x): + """Cosine, element-wise. + + Args: + x: Input tensor. 
+ + Returns: + The corresponding cosine values. + """ + if any_symbolic_tensors((x,)): + return Cos().symbolic_call(x) + return backend.numpy.cos(x) + + +class Cosh(Operation): + def call(self, x): + return backend.numpy.cosh(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.cosh", "keras.ops.numpy.cosh"]) +def cosh(x): + """Hyperbolic cosine, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. + """ + if any_symbolic_tensors((x,)): + return Cosh().symbolic_call(x) + return backend.numpy.cosh(x) + + +class CountNonzero(Operation): + def __init__(self, axis=None): + super().__init__() + if isinstance(axis, int): + self.axis = (axis,) + else: + self.axis = axis + + def call(self, x): + return backend.numpy.count_nonzero(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape(x.shape, axis=self.axis), + dtype="int32", + ) + + +@keras_export( + [ + "keras.ops.count_nonzero", + "keras.ops.numpy.count_nonzero", + ] +) +def count_nonzero(x, axis=None): + """Counts the number of non-zero values in `x` along the given `axis`. + + If no axis is specified then all non-zeros in the tensor are counted. + + Args: + x: Input tensor. + axis: Axis or tuple of axes along which to count the number of + non-zeros. Defaults to `None`. + + Returns: + int or tensor of ints. 
+ + Examples: + >>> x = keras.ops.array([[0, 1, 7, 0], [3, 0, 2, 19]]) + >>> keras.ops.count_nonzero(x) + 5 + >>> keras.ops.count_nonzero(x, axis=0) + array([1, 1, 2, 1], dtype=int64) + >>> keras.ops.count_nonzero(x, axis=1) + array([2, 3], dtype=int64) + """ + if any_symbolic_tensors((x,)): + return CountNonzero(axis=axis).symbolic_call(x) + return backend.numpy.count_nonzero(x, axis=axis) + + +class Cross(Operation): + def __init__(self, axisa=-1, axisb=-1, axisc=-1, axis=None): + super().__init__() + if axis is not None: + self.axisa = axis + self.axisb = axis + self.axisc = axis + else: + self.axisa = axisa + self.axisb = axisb + self.axisc = axisc + + def call(self, x1, x2): + return backend.numpy.cross(x1, x2, self.axisa, self.axisb, self.axisc) + + def compute_output_spec(self, x1, x2): + x1_shape = list(x1.shape) + x2_shape = list(x2.shape) + + x1_value_size = x1_shape[self.axisa] + x2_value_size = x2_shape[self.axisa] + del x1_shape[self.axisa] + del x2_shape[self.axisb] + output_shape = broadcast_shapes(x1_shape, x2_shape) + + if x1_value_size is not None and x1_value_size not in (2, 3): + raise ValueError( + "`x1`'s dim on `axis={axisa}` must be either 2 or 3, but " + f"received: {x1_value_size}" + ) + if x2_value_size is not None and x2_value_size not in (2, 3): + raise ValueError( + "`x2`'s dim on `axis={axisb}` must be either 2 or 3, but " + f"received: {x2_value_size}" + ) + + if x1_value_size == 3 or x2_value_size == 3: + value_size = [3] + else: + value_size = [] + + output_shape = ( + output_shape[: self.axisc] + value_size + output_shape[self.axisc :] + ) + + dtype = dtypes.result_type(x1.dtype, x2.dtype) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.cross", "keras.ops.numpy.cross"]) +def cross(x1, x2, axisa=-1, axisb=-1, axisc=-1, axis=None): + """Returns the cross product of two (arrays of) vectors. + + The cross product of `x1` and `x2` in R^3 is a vector + perpendicular to both `x1` and `x2`. 
If `x1` and `x2` are arrays of + vectors, the vectors are defined by the last axis of `x1` and `x2` + by default, and these axes can have dimensions 2 or 3. + + Where the dimension of either `x1` or `x2` is 2, the third component of + the input vector is assumed to be zero and the cross product calculated + accordingly. + + In cases where both input vectors have dimension 2, the z-component of + the cross product is returned. + + Args: + x1: Components of the first vector(s). + x2: Components of the second vector(s). + axisa: Axis of `x1` that defines the vector(s). Defaults to `-1`. + axisb: Axis of `x2` that defines the vector(s). Defaults to `-1`. + axisc: Axis of the result containing the cross product vector(s). + Ignored if both input vectors have dimension 2, as the return is + scalar. By default, the last axis. + axis: If defined, the axis of `x1`, `x2` and the result that + defines the vector(s) and cross product(s). Overrides `axisa`, + `axisb` and `axisc`. + + Note: + Torch backend does not support two dimensional vectors, or the + arguments `axisa`, `axisb` and `axisc`. Use `axis` instead. + + Returns: + Vector cross product(s). 
+ """ + if any_symbolic_tensors((x1, x2)): + return Cross( + axisa=axisa, axisb=axisb, axisc=axisc, axis=axis + ).symbolic_call(x1, x2) + return backend.numpy.cross( + x1, + x2, + axisa=axisa, + axisb=axisb, + axisc=axisc, + axis=axis, + ) + + +class Cumprod(Operation): + def __init__(self, axis=None, dtype=None): + super().__init__() + self.axis = axis + self.dtype = dtype + + def call(self, x): + return backend.numpy.cumprod(x, axis=self.axis, dtype=self.dtype) + + def compute_output_spec(self, x): + if self.axis is None: + if None in x.shape: + output_shape = (None,) + else: + output_shape = (int(np.prod(x.shape)),) + else: + output_shape = x.shape + output_dtype = backend.standardize_dtype(self.dtype or x.dtype) + if output_dtype == "bool": + output_dtype = "int32" + return KerasTensor(output_shape, output_dtype) + + +@keras_export(["keras.ops.cumprod", "keras.ops.numpy.cumprod"]) +def cumprod(x, axis=None, dtype=None): + """Return the cumulative product of elements along a given axis. + + Args: + x: Input tensor. + axis: Axis along which the cumulative product is computed. + By default the input is flattened. + dtype: dtype of returned tensor. Defaults to x.dtype. + + Returns: + Output tensor. 
+ """ + return Cumprod(axis=axis, dtype=dtype)(x) + + +class Cumsum(Operation): + def __init__(self, axis=None, dtype=None): + super().__init__() + self.axis = axis + self.dtype = dtype + + def call(self, x): + return backend.numpy.cumsum(x, axis=self.axis, dtype=self.dtype) + + def compute_output_spec(self, x): + if self.axis is None: + if None in x.shape: + output_shape = (None,) + else: + output_shape = (int(np.prod(x.shape)),) + else: + output_shape = x.shape + output_dtype = backend.standardize_dtype(self.dtype or x.dtype) + if output_dtype == "bool": + output_dtype = "int32" + return KerasTensor(output_shape, output_dtype) + + +@keras_export(["keras.ops.cumsum", "keras.ops.numpy.cumsum"]) +def cumsum(x, axis=None, dtype=None): + """Returns the cumulative sum of elements along a given axis. + + Args: + x: Input tensor. + axis: Axis along which the cumulative sum is computed. + By default the input is flattened. + dtype: dtype of returned tensor. Defaults to x.dtype. + + Returns: + Output tensor. + """ + return Cumsum(axis=axis, dtype=dtype)(x) + + +class Diag(Operation): + def __init__(self, k=0): + super().__init__() + self.k = k + + def call(self, x): + return backend.numpy.diag(x, k=self.k) + + def compute_output_spec(self, x): + x_shape = x.shape + if len(x_shape) == 1: + if x_shape[0] is None: + output_shape = [None, None] + else: + output_shape = [ + x_shape[0] + int(np.abs(self.k)), + x_shape[0] + int(np.abs(self.k)), + ] + elif len(x_shape) == 2: + if None in x_shape: + output_shape = [None] + else: + shorter_side = np.minimum(x_shape[0], x_shape[1]) + if self.k > 0: + remaining = x_shape[1] - self.k + else: + remaining = x_shape[0] + self.k + output_shape = [ + int(np.maximum(0, np.minimum(remaining, shorter_side))) + ] + else: + raise ValueError( + f"`x` must be 1-D or 2-D, but received shape {x.shape}." 
            )
        return KerasTensor(output_shape, dtype=x.dtype)


@keras_export(["keras.ops.diag", "keras.ops.numpy.diag"])
def diag(x, k=0):
    """Extract a diagonal or construct a diagonal array.

    Args:
        x: Input tensor. If `x` is 2-D, returns the k-th diagonal of `x`.
            If `x` is 1-D, return a 2-D tensor with `x` on the k-th diagonal.
        k: The diagonal to consider. Defaults to `0`. Use `k > 0` for diagonals
            above the main diagonal, and `k < 0` for diagonals below
            the main diagonal.

    Returns:
        The extracted diagonal or constructed diagonal tensor.

    Examples:
    >>> from keras.src import ops
    >>> x = ops.arange(9).reshape((3, 3))
    >>> x
    array([[0, 1, 2],
           [3, 4, 5],
           [6, 7, 8]])

    >>> ops.diag(x)
    array([0, 4, 8])
    >>> ops.diag(x, k=1)
    array([1, 5])
    >>> ops.diag(x, k=-1)
    array([3, 7])

    >>> ops.diag(ops.diag(x))
    array([[0, 0, 0],
           [0, 4, 0],
           [0, 0, 8]])
    """
    if any_symbolic_tensors((x,)):
        return Diag(k=k).symbolic_call(x)
    return backend.numpy.diag(x, k=k)


class Diagflat(Operation):
    """Symbolic op for `diagflat`: flattened input placed on a diagonal."""

    def __init__(self, k=0):
        super().__init__()
        self.k = k

    def call(self, x):
        return backend.numpy.diagflat(x, k=self.k)

    def compute_output_spec(self, x):
        x_shape = x.shape

        # Number of elements after flattening; None if any dim is unknown.
        if len(x_shape) == 0:
            flat_size = 1
        elif len(x_shape) == 1:
            flat_size = x_shape[0] if x_shape[0] is not None else None
        else:
            flat_size = None
            for s in x_shape:
                if s is None:
                    flat_size = None
                    break
                elif flat_size is None:
                    flat_size = s
                else:
                    flat_size *= s

        # Output is square: flattened size grown by |k| for the offset.
        if flat_size is None:
            output_shape = [None, None]
        else:
            output_shape = [
                flat_size + int(np.abs(self.k)),
                flat_size + int(np.abs(self.k)),
            ]

        return KerasTensor(output_shape, dtype=x.dtype)


@keras_export(["keras.ops.diagflat", "keras.ops.numpy.diagflat"])
def diagflat(x, k=0):
    """Create a two-dimensional array with the flattened input on
    the k-th diagonal.

    Args:
        x: Input tensor to be flattened and placed on the diagonal.
+ k: The diagonal to place the flattened input. Defaults to `0`. + Use `k > 0` for diagonals above the main diagonal, + and `k < 0` for diagonals below the main diagonal. + + Returns: + A 2-D tensor with the flattened input on the specified diagonal. + """ + if any_symbolic_tensors((x,)): + return Diagflat(k=k).symbolic_call(x) + return backend.numpy.diagflat(x, k=k) + + +class Diagonal(Operation): + def __init__(self, offset=0, axis1=0, axis2=1): + super().__init__() + self.offset = offset + self.axis1 = axis1 + self.axis2 = axis2 + + def call(self, x): + return backend.numpy.diagonal( + x, + offset=self.offset, + axis1=self.axis1, + axis2=self.axis2, + ) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + if len(x_shape) < 2: + raise ValueError( + "`diagonal` requires an array of at least two dimensions, but " + "`x` is of shape {x.shape}." + ) + + shape_2d = [x_shape[self.axis1], x_shape[self.axis2]] + x_shape[self.axis1] = -1 + x_shape[self.axis2] = -1 + output_shape = list(filter((-1).__ne__, x_shape)) + if None in shape_2d: + diag_shape = [None] + else: + shorter_side = np.minimum(shape_2d[0], shape_2d[1]) + if self.offset > 0: + remaining = shape_2d[1] - self.offset + else: + remaining = shape_2d[0] + self.offset + diag_shape = [ + int(np.maximum(0, np.minimum(remaining, shorter_side))) + ] + output_shape = output_shape + diag_shape + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.diagonal", "keras.ops.numpy.diagonal"]) +def diagonal(x, offset=0, axis1=0, axis2=1): + """Return specified diagonals. + + If `x` is 2-D, returns the diagonal of `x` with the given offset, i.e., the + collection of elements of the form `x[i, i+offset]`. + + If `x` has more than two dimensions, the axes specified by `axis1` + and `axis2` are used to determine the 2-D sub-array whose diagonal + is returned. 
+ + The shape of the resulting array can be determined by removing `axis1` + and `axis2` and appending an index to the right equal to the size of + the resulting diagonals. + + Args: + x: Input tensor. + offset: Offset of the diagonal from the main diagonal. + Can be positive or negative. Defaults to `0`.(main diagonal). + axis1: Axis to be used as the first axis of the 2-D sub-arrays. + Defaults to `0`.(first axis). + axis2: Axis to be used as the second axis of the 2-D sub-arrays. + Defaults to `1` (second axis). + + Returns: + Tensor of diagonals. + + Examples: + >>> from keras.src import ops + >>> x = ops.arange(4).reshape((2, 2)) + >>> x + array([[0, 1], + [2, 3]]) + >>> x.diagonal() + array([0, 3]) + >>> x.diagonal(1) + array([1]) + + >>> x = ops.arange(8).reshape((2, 2, 2)) + >>> x + array([[[0, 1], + [2, 3]], + [[4, 5], + [6, 7]]]) + >>> x.diagonal(0, 0, 1) + array([[0, 6], + [1, 7]]) + """ + if any_symbolic_tensors((x,)): + return Diagonal( + offset=offset, + axis1=axis1, + axis2=axis2, + ).symbolic_call(x) + return backend.numpy.diagonal( + x, + offset=offset, + axis1=axis1, + axis2=axis2, + ) + + +class Diff(Operation): + def __init__(self, n=1, axis=-1): + super().__init__() + self.n = n + self.axis = axis + + def call(self, a): + return backend.numpy.diff(a, n=self.n, axis=self.axis) + + def compute_output_spec(self, a): + shape = list(a.shape) + size = shape[self.axis] + if size is not None: + shape[self.axis] = builtins.max(size - self.n, 0) + return KerasTensor(shape, dtype=a.dtype) + + +@keras_export(["keras.ops.diff", "keras.ops.numpy.diff"]) +def diff(a, n=1, axis=-1): + """Calculate the n-th discrete difference along the given axis. + + The first difference is given by `out[i] = a[i+1] - a[i]` along + the given axis, higher differences are calculated by using `diff` + recursively. + + Args: + a: Input tensor. + n: The number of times values are differenced. Defaults to `1`. + axis: Axis to compute discrete difference(s) along. 
        Defaults to `-1` (last axis).

    Returns:
        Tensor of n-th differences. The size along `axis` is reduced
        by `n`.

    Examples:
    >>> from keras.src import ops
    >>> x = ops.convert_to_tensor([1, 2, 4, 7, 0])
    >>> ops.diff(x)
    array([ 1, 2, 3, -7])
    >>> ops.diff(x, n=2)
    array([ 1, 1, -10])

    >>> x = ops.convert_to_tensor([[1, 3, 6, 10], [0, 5, 6, 8]])
    >>> ops.diff(x)
    array([[2, 3, 4],
           [5, 1, 2]])
    >>> ops.diff(x, axis=0)
    array([[-1, 2, 0, -2]])
    """
    return Diff(n=n, axis=axis)(a)


class Digitize(Operation):
    """Symbolic op for `digitize`: bin index for each input value."""

    def call(self, x, bins):
        return backend.numpy.digitize(x, bins)

    def compute_output_spec(self, x, bins):
        bins_shape = bins.shape
        if len(bins_shape) > 1:
            raise ValueError(
                f"`bins` must be a 1D array. Received: bins={bins} "
                f"with shape bins.shape={bins_shape}"
            )
        sparse = getattr(x, "sparse", False)
        return KerasTensor(x.shape, dtype="int32", sparse=sparse)


@keras_export(["keras.ops.digitize", "keras.ops.numpy.digitize"])
def digitize(x, bins):
    """Returns the indices of the bins to which each value in `x` belongs.

    Args:
        x: Input array to be binned.
        bins: Array of bins. It has to be one-dimensional and monotonically
            increasing.

    Returns:
        Output array of indices, of same shape as `x`.
+ + Example: + >>> x = np.array([0.0, 1.0, 3.0, 1.6]) + >>> bins = np.array([0.0, 3.0, 4.5, 7.0]) + >>> keras.ops.digitize(x, bins) + array([1, 1, 2, 1]) + """ + if any_symbolic_tensors((x, bins)): + return Digitize().symbolic_call(x, bins) + return backend.numpy.digitize(x, bins) + + +class Dot(Operation): + def call(self, x1, x2): + return backend.numpy.dot(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = list(getattr(x1, "shape", [])) + x2_shape = list(getattr(x2, "shape", [])) + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + if x1_shape == [] or x2_shape == []: + return multiply(x1, x2) + if len(x1_shape) == 1 and len(x2_shape) == 1: + return KerasTensor([], dtype=dtype) + if len(x2_shape) == 1: + if x1_shape[-1] != x2_shape[0]: + raise ValueError( + "Shape must match on the last axis of `x1` and `x2` when " + "`x1` is N-d array while `x2` is 1-D, but receive shape " + f"`x1.shape={x1.shape}` and x2.shape=`{x2.shape}`." + ) + return KerasTensor(x1_shape[:-1], dtype=dtype) + + if ( + x1_shape[-1] is None + or x2_shape[-2] is None + or x1_shape[-1] == x2_shape[-2] + ): + del x1_shape[-1] + del x2_shape[-2] + return KerasTensor(x1_shape + x2_shape, dtype=dtype) + + raise ValueError( + "Shape must match on the last axis of `x1` and second last " + "axis of `x2` when `x1` is N-d array while `x2` is M-D, but " + f"received `x1.shape={x1.shape}` and x2.shape=`{x2.shape}`." + ) + + +@keras_export(["keras.ops.dot", "keras.ops.numpy.dot"]) +def dot(x1, x2): + """Dot product of two tensors. + + - If both `x1` and `x2` are 1-D tensors, it is inner product of vectors + (without complex conjugation). + - If both `x1` and `x2` are 2-D tensors, it is matrix multiplication. + - If either `x1` or `x2` is 0-D (scalar), it is equivalent to `x1 * x2`. + - If `x1` is an N-D tensor and `x2` is a 1-D tensor, it is a sum product + over the last axis of `x1` and `x2`. 
+ - If `x1` is an N-D tensor and `x2` is an M-D tensor (where `M>=2`), + it is a sum product over the last axis of `x1` and the second-to-last + axis of `x2`: `dot(x1, x2)[i,j,k,m] = sum(a[i,j,:] * b[k,:,m])`. + + Args: + x1: First argument. + x2: Second argument. + + Note: + Torch backend does not accept 0-D tensors as arguments. + + Returns: + Dot product of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Dot().symbolic_call(x1, x2) + return backend.numpy.dot(x1, x2) + + +class Einsum(Operation): + def __init__(self, subscripts): + super().__init__() + self.subscripts = subscripts + + def call(self, *operands): + return backend.numpy.einsum(self.subscripts, *operands) + + def compute_output_spec(self, *operands): + """Compute the output shape of `einsum`. + + The shape computation follows the steps below: + 1. Find all letters in the input specs (left part of "->"), and + break them into two categories: letters appearing more than once + go to `reduced_dims`, otherwise go to `kept_dims`. + 2. Adjust `reduced_dims` and `kept_dims` based on the output spec + (right part of "->"). The rule is if the letter appears in the + output spec, then move it to `kept_dims`, otherwise move it to + `reduced_dims`. + 3. Compute the target output shape. If no output spec is set, then + the target output shape will be "...{kept_dims}", e.g., "...ijk", + else it will be the same as output spec. "..." is a wildcard that + could map shape of arbitrary length. + 4. For each operand in `operands`, map the shape specified in the input + spec to the output target, e.g, if operand is of shape [2,3,4], + input spec is "i..." and output target is "i...jk", then 2 will go + the index 0. For dims not represented by any letter, insert to the + wildcard part. For each letter in output target not appearing in + input spec, the dim will be 1 for broadcasting. After 4, each + operand should have a target shape containing only number and + `None`. + 5. 
Broadcast all shapes computed from 4, and the result is the output + shape. + + Let's take an example to illustrate the steps above. Let's define: + ```python + x = KerasTensor([None, 3, 4]) + y = KerasTensor(2, 4, 3) + z = knp.einsum("...ij, kji->...k", x, y) + ``` + + 1. `reduced_dims` is {"i", "j"}, `kept_dims` is {"k"}. + 2. `reduced_dims` is still {"i", "j"}, and `kept_dims` is {"k"}. + 3. Output target is "...k". + 4. For `x`, the input spec is "...ij", and the output target is "...k". + "i" and "j" do not appear in the output target, so no replacement + happens, and [None] goes to wildcard. Afterwards, "k" is replaced + by 1, so we get shape [None, 1]. Applying the same logic to `y`, we + get shape [2]. + 5. Broadcast [None, 1] and [2], and we get [None, 2], which is the + output shape. + """ + split_subscripts = self.subscripts.split("->") + if len(split_subscripts) > 2: + raise ValueError( + "At most one '->' is supported in `einsum` subscripts, but " + f"received {self.subscripts}." + ) + if len(split_subscripts) == 2: + subscripts = split_subscripts[0] + output_spec = split_subscripts[1] + else: + subscripts = self.subscripts + output_spec = None + input_specs = subscripts.split(",") + if len(input_specs) != len(operands): + raise ValueError( + f"Number of operands ({len(operands)}) does not match the " + f"number of input specs ({len(input_specs)}) in `einsum`, " + f"received subscripts={self.subscripts}." + ) + reduced_dims = set() + kept_dims = set() + for s in subscripts: + if not s.isalpha(): + continue + if s not in reduced_dims and s not in kept_dims: + kept_dims.add(s) + elif s in kept_dims: + kept_dims.remove(s) + reduced_dims.add(s) + + if output_spec is not None: + # The output spec changes the rule of kept_dims and reduced_dims. + # In short, dims appearing in the output spec will be kept, and + # dims not appearing in the output spec will be reduced. 
+ kept_dims_copy = kept_dims.copy() + reduced_dims_copy = reduced_dims.copy() + for dim in kept_dims: + if dim not in output_spec: + kept_dims_copy.remove(dim) + reduced_dims_copy.add(dim) + for dim in reduced_dims: + if dim in output_spec: + reduced_dims_copy.remove(dim) + kept_dims_copy.add(dim) + kept_dims = kept_dims_copy + reduced_dims = reduced_dims_copy + + reduced_dims = sorted(reduced_dims) + kept_dims = sorted(kept_dims) + + if output_spec is None: + target_broadcast_spec = "..." + "".join(kept_dims) + else: + target_broadcast_spec = output_spec + + expanded_operands_shapes = [] + for x, spec in zip(operands, input_specs): + x_shape = getattr(x, "shape", []) + x_shape = [-1 if size is None else size for size in x_shape] + split_spec = spec.split("...") + expanded_shape = target_broadcast_spec + if len(split_spec) == 1: + # In this case, the input spec is just a string of letters, + # e.g., "ijk". + if len(x_shape) != len(split_spec[0]): + raise ValueError( + "Number of dimensions in the subscript does not " + "match the number of dimensions in the operand, " + f"received subscript `{spec}` and operand of shape " + f"{x_shape}." + ) + for size, s in zip(x_shape, split_spec[0]): + # Replace the letter with the right shape. + expanded_shape = expanded_shape.replace(s, str(size) + " ") + expanded_shape = expanded_shape.replace("...", "") + else: + # In this case, the input spec has "...", e.g., "i...j", "i...", + # or "...j". + for i in range(len(split_spec[0])): + expanded_shape = expanded_shape.replace( + split_spec[0][i], str(x_shape[i]) + " " + ) + for i in range(len(split_spec[1])): + expanded_shape = expanded_shape.replace( + split_spec[1][-i - 1], str(x_shape[-i - 1]) + " " + ) + # Shape matched by "..." will be inserted to the position of + # "...". 
+ wildcard_shape_start_index = len(split_spec[0]) + wildcard_shape_end_index = ( + len(x_shape) + if len(split_spec[1]) == 0 + else -len(split_spec[1]) + ) + wildcard_shape = x_shape[ + wildcard_shape_start_index:wildcard_shape_end_index + ] + wildcard_shape_str = ( + " ".join([str(size) for size in wildcard_shape]) + " " + ) + expanded_shape = expanded_shape.replace( + "...", wildcard_shape_str + ) + # Replace all letters not yet handled with "1" for broadcasting. + expanded_shape = re.sub("[a-z]", "1 ", expanded_shape) + expanded_shape = expanded_shape.split() + expanded_shape = [ + None if size == "-1" else int(size) for size in expanded_shape + ] + expanded_operands_shapes.append(expanded_shape) + + output_shape = expanded_operands_shapes[0] + for shape in expanded_operands_shapes[1:]: + output_shape = broadcast_shapes(output_shape, shape) + dtypes_to_resolve = list( + set( + backend.standardize_dtype(getattr(x, "dtype", type(x))) + for x in operands + ) + ) + if len(dtypes_to_resolve) == 1 and dtypes_to_resolve[0] == "int8": + dtype = "int32" + else: + dtype = dtypes.result_type(*dtypes_to_resolve) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.einsum", "keras.ops.numpy.einsum"]) +def einsum(subscripts, *operands): + """Evaluates the Einstein summation convention on the operands. + + Args: + subscripts: Specifies the subscripts for summation as comma separated + list of subscript labels. An implicit (classical Einstein + summation) calculation is performed unless the explicit indicator + `->` is included as well as subscript labels of the precise + output form. + operands: The operands to compute the Einstein sum of. + + Returns: + The calculation based on the Einstein summation convention. 
+ + Example: + >>> from keras.src import ops + >>> a = ops.arange(25).reshape(5, 5) + >>> b = ops.arange(5) + >>> c = ops.arange(6).reshape(2, 3) + + Trace of a matrix: + + >>> ops.einsum("ii", a) + 60 + >>> ops.einsum(a, [0, 0]) + 60 + >>> ops.trace(a) + 60 + + Extract the diagonal: + + >>> ops.einsum("ii -> i", a) + array([ 0, 6, 12, 18, 24]) + >>> ops.einsum(a, [0, 0], [0]) + array([ 0, 6, 12, 18, 24]) + >>> ops.diag(a) + array([ 0, 6, 12, 18, 24]) + + Sum over an axis: + + >>> ops.einsum("ij -> i", a) + array([ 10, 35, 60, 85, 110]) + >>> ops.einsum(a, [0, 1], [0]) + array([ 10, 35, 60, 85, 110]) + >>> ops.sum(a, axis=1) + array([ 10, 35, 60, 85, 110]) + + For higher dimensional tensors summing a single axis can be done + with ellipsis: + + >>> ops.einsum("...j -> ...", a) + array([ 10, 35, 60, 85, 110]) + >>> np.einsum(a, [..., 1], [...]) + array([ 10, 35, 60, 85, 110]) + + Compute a matrix transpose or reorder any number of axes: + + >>> ops.einsum("ji", c) + array([[0, 3], + [1, 4], + [2, 5]]) + >>> ops.einsum("ij -> ji", c) + array([[0, 3], + [1, 4], + [2, 5]]) + >>> ops.einsum(c, [1, 0]) + array([[0, 3], + [1, 4], + [2, 5]]) + >>> ops.transpose(c) + array([[0, 3], + [1, 4], + [2, 5]]) + + Matrix vector multiplication: + + >>> ops.einsum("ij, j", a, b) + array([ 30, 80, 130, 180, 230]) + >>> ops.einsum(a, [0, 1], b, [1]) + array([ 30, 80, 130, 180, 230]) + >>> ops.einsum("...j, j", a, b) + array([ 30, 80, 130, 180, 230]) + """ + if any_symbolic_tensors(operands): + return Einsum(subscripts).symbolic_call(*operands) + return backend.numpy.einsum(subscripts, *operands) + + +class Empty(Operation): + def call(self, shape, dtype=None): + return backend.numpy.empty(shape, dtype=dtype) + + def compute_output_spec(self, shape, dtype=None): + dtype = dtype or backend.floatx() + return KerasTensor(shape, dtype=dtype) + + +@keras_export(["keras.ops.empty", "keras.ops.numpy.empty"]) +def empty(shape, dtype=None): + """Return a tensor of given shape and type filled 
with uninitialized data. + + Args: + shape: Shape of the empty tensor. + dtype: Desired data type of the empty tensor. + + Returns: + The empty tensor. + """ + return backend.numpy.empty(shape, dtype=dtype) + + +class Equal(Operation): + def call(self, x1, x2): + return backend.numpy.equal(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export(["keras.ops.equal", "keras.ops.numpy.equal"]) +def equal(x1, x2): + """Returns `(x1 == x2)` element-wise. + + Args: + x1: Tensor to compare. + x2: Tensor to compare. + + Returns: + Output tensor, element-wise comparison of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Equal().symbolic_call(x1, x2) + return backend.numpy.equal(x1, x2) + + +class Exp(Operation): + def call(self, x): + return backend.numpy.exp(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(x.dtype) + if "int" in dtype or dtype == "bool": + dtype = backend.floatx() + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.exp", "keras.ops.numpy.exp"]) +def exp(x): + """Calculate the exponential of all elements in the input tensor. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise exponential of `x`. + """ + if any_symbolic_tensors((x,)): + return Exp().symbolic_call(x) + return backend.numpy.exp(x) + + +class Exp2(Operation): + def call(self, x): + return backend.numpy.exp2(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(x.dtype) + if "int" in dtype or dtype == "bool": + dtype = backend.floatx() + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.exp2", "keras.ops.numpy.exp2"]) +def exp2(x): + """Calculate the base-2 exponential of all elements in the input tensor. + + Args: + x: Input tensor. 
+ + Returns: + Output tensor, element-wise base-2 exponential of `x`. + """ + if any_symbolic_tensors((x,)): + return Exp2().symbolic_call(x) + return backend.numpy.exp2(x) + + +class ExpandDims(Operation): + def __init__(self, axis): + super().__init__() + if not isinstance(axis, (int, tuple, list)): + raise ValueError( + "The `axis` argument to `expand_dims` should be an integer, " + f"tuple or list. Received axis={axis}" + ) + self.axis = axis + + def call(self, x): + return backend.numpy.expand_dims(x, self.axis) + + def compute_output_spec(self, x): + output_shape = operation_utils.compute_expand_dims_output_shape( + x.shape, self.axis + ) + sparse = getattr(x, "sparse", False) + return KerasTensor(output_shape, dtype=x.dtype, sparse=sparse) + + +@keras_export( + [ + "keras.ops.expand_dims", + "keras.ops.numpy.expand_dims", + ] +) +def expand_dims(x, axis): + """Expand the shape of a tensor. + + Insert a new axis at the `axis` position in the expanded tensor shape. + + Args: + x: Input tensor. + axis: Position in the expanded axes where the new axis + (or axes) is placed. + + Returns: + Output tensor with the number of dimensions increased. + """ + if any_symbolic_tensors((x,)): + return ExpandDims(axis=axis).symbolic_call(x) + return backend.numpy.expand_dims(x, axis) + + +class Expm1(Operation): + def call(self, x): + return backend.numpy.expm1(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(x.dtype) + if "int" in dtype or dtype == "bool": + dtype = backend.floatx() + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.expm1", "keras.ops.numpy.expm1"]) +def expm1(x): + """Calculate `exp(x) - 1` for all elements in the tensor. + + Args: + x: Input values. + + Returns: + Output tensor, element-wise exponential minus one. 
+ """ + if any_symbolic_tensors((x,)): + return Expm1().symbolic_call(x) + return backend.numpy.expm1(x) + + +class Flip(Operation): + def __init__(self, axis=None): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.numpy.flip(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.flip", "keras.ops.numpy.flip"]) +def flip(x, axis=None): + """Reverse the order of elements in the tensor along the given axis. + + The shape of the tensor is preserved, but the elements are reordered. + + Args: + x: Input tensor. + axis: Axis or axes along which to flip the tensor. The default, + `axis=None`, will flip over all of the axes of the input tensor. + + Returns: + Output tensor with entries of `axis` reversed. + """ + if any_symbolic_tensors((x,)): + return Flip(axis=axis).symbolic_call(x) + return backend.numpy.flip(x, axis=axis) + + +class Floor(Operation): + def call(self, x): + return backend.numpy.floor(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + dtype = ( + backend.floatx() + if backend.standardize_dtype(x.dtype) == "int64" + else dtypes.result_type(x.dtype, float) + ) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.floor", "keras.ops.numpy.floor"]) +def floor(x): + """Return the floor of the input, element-wise. + + The floor of the scalar `x` is the largest integer `i`, such that `i <= x`. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise floor of `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Floor().symbolic_call(x) + return backend.numpy.floor(x) + + +class Full(Operation): + def call(self, shape, fill_value, dtype=None): + return backend.numpy.full(shape, fill_value, dtype=dtype) + + def compute_output_spec(self, shape, fill_value, dtype=None): + dtype = dtype or backend.floatx() + return KerasTensor(shape, dtype=dtype) + + +@keras_export(["keras.ops.full", "keras.ops.numpy.full"]) +def full(shape, fill_value, dtype=None): + """Return a new tensor of given shape and type, filled with `fill_value`. + + Args: + shape: Shape of the new tensor. + fill_value: Fill value. + dtype: Desired data type of the tensor. + + Returns: + Output tensor. + """ + return backend.numpy.full(shape, fill_value, dtype=dtype) + + +class FullLike(Operation): + def call(self, x, fill_value, dtype=None): + return backend.numpy.full_like(x, fill_value, dtype=dtype) + + def compute_output_spec(self, x, fill_value, dtype=None): + dtype = dtype or x.dtype + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.full_like", "keras.ops.numpy.full_like"]) +def full_like(x, fill_value, dtype=None): + """Return a full tensor with the same shape and type as the given tensor. + + Args: + x: Input tensor. + fill_value: Fill value. + dtype: Overrides data type of the result. + + Returns: + Tensor of `fill_value` with the same shape and type as `x`. 
+ """ + if any_symbolic_tensors((x,)): + return FullLike().symbolic_call(x, fill_value, dtype=dtype) + return backend.numpy.full_like(x, fill_value, dtype=dtype) + + +class GetItem(Operation): + def call(self, x, key): + if isinstance(key, list): + key = tuple(key) + return x[key] + + def compute_output_spec(self, x, key): + remaining_shape = list(x.shape) + new_shape = [] + if isinstance(key, int): + remaining_key = [key] + elif isinstance(key, tuple): + remaining_key = list(key) + elif isinstance(key, list): + remaining_key = key.copy() + else: + raise ValueError( + f"Unsupported key type for array slice. Received: `{key}`" + ) + num_ellipses = remaining_key.count(Ellipsis) + if num_ellipses > 1: + raise ValueError( + f"Slice should only have one ellipsis. Received: `{key}`" + ) + elif num_ellipses == 0: + # Add an implicit final ellipsis. + remaining_key.append(Ellipsis) + # Consume slice key element by element. + while True: + if not remaining_key: + break + subkey = remaining_key.pop(0) + # Check for `newaxis` and `Ellipsis`. + if subkey == Ellipsis: + # Keep as many slices remain in our key, omitting `newaxis`. + needed = len(remaining_key) - remaining_key.count(np.newaxis) + consumed = len(remaining_shape) - needed + new_shape += remaining_shape[:consumed] + remaining_shape = remaining_shape[consumed:] + continue + # All frameworks follow numpy for newaxis. `np.newaxis == None`. + if subkey == np.newaxis: + new_shape.append(1) + continue + # At this point, we need to consume a new axis from the shape. + if not remaining_shape: + raise ValueError( + f"Array has shape {x.shape} but slice " + f"has to many indices. Received: `{key}`" + ) + length = remaining_shape.pop(0) + if isinstance(subkey, int): + if length is not None: + index = subkey if subkey >= 0 else subkey + length + if index < 0 or index >= length: + raise ValueError( + f"Array has shape {x.shape} but out-of-bounds " + f"index {key} was requested." 
+ ) + elif isinstance(subkey, slice): + if length is not None: + # python3 friendly way to compute a slice length. + new_length = len(range(*subkey.indices(length))) + new_shape.append(new_length) + else: + new_shape.append(length) + else: + raise ValueError( + f"Unsupported key type for array slice. Received: `{key}`" + ) + return KerasTensor(tuple(new_shape), dtype=x.dtype) + + +@keras_export(["keras.ops.get_item", "keras.ops.numpy.get_item"]) +def get_item(x, key): + """Return `x[key]`.""" + if any_symbolic_tensors((x,)): + return GetItem().symbolic_call(x, key) + return x[key] + + +class Greater(Operation): + def call(self, x1, x2): + return backend.numpy.greater(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export(["keras.ops.greater", "keras.ops.numpy.greater"]) +def greater(x1, x2): + """Return the truth value of `x1 > x2` element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise comparison of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Greater().symbolic_call(x1, x2) + return backend.numpy.greater(x1, x2) + + +class GreaterEqual(Operation): + def call(self, x1, x2): + return backend.numpy.greater_equal(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export( + [ + "keras.ops.greater_equal", + "keras.ops.numpy.greater_equal", + ] +) +def greater_equal(x1, x2): + """Return the truth value of `x1 >= x2` element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise comparison of `x1` and `x2`. 
+ """ + if any_symbolic_tensors((x1, x2)): + return GreaterEqual().symbolic_call(x1, x2) + return backend.numpy.greater_equal(x1, x2) + + +class Hstack(Operation): + def call(self, xs): + return backend.numpy.hstack(xs) + + def compute_output_spec(self, xs): + first_shape = xs[0].shape + total_size_on_axis = 0 + dtypes_to_resolve = [] + for x in xs: + if not shape_equal(x.shape, first_shape, axis=[1], allow_none=True): + raise ValueError( + "Every value in `xs` must have the same shape except on " + f"the `axis` dim. But found element of shape {x.shape}, " + f"which is different from the first element's " + f"shape {first_shape}." + ) + if total_size_on_axis is None or x.shape[1] is None: + total_size_on_axis = None + else: + total_size_on_axis += x.shape[1] + dtypes_to_resolve.append(getattr(x, "dtype", type(x))) + output_shape = list(first_shape) + output_shape[1] = total_size_on_axis + dtype = dtypes.result_type(*dtypes_to_resolve) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.hstack", "keras.ops.numpy.hstack"]) +def hstack(xs): + """Stack tensors in sequence horizontally (column wise). + + This is equivalent to concatenation along the first axis for 1-D tensors, + and along the second axis for all other tensors. + + Args: + xs: Sequence of tensors. + + Returns: + The tensor formed by stacking the given tensors. + """ + if any_symbolic_tensors((xs,)): + return Hstack().symbolic_call(xs) + return backend.numpy.hstack(xs) + + +class Identity(Operation): + def call(self, n, dtype=None): + return backend.numpy.identity(n, dtype=dtype) + + def compute_output_spec(self, n, dtype=None): + dtype = dtype or backend.floatx() + return KerasTensor([n, n], dtype=dtype) + + +@keras_export(["keras.ops.identity", "keras.ops.numpy.identity"]) +def identity(n, dtype=None): + """Return the identity tensor. + + The identity tensor is a square tensor with ones on the main diagonal and + zeros elsewhere. 
+ + Args: + n: Number of rows (and columns) in the `n x n` output tensor. + dtype: Data type of the output tensor. + + Returns: + The identity tensor. + """ + return backend.numpy.identity(n, dtype=dtype) + + +class Imag(Operation): + def call(self, x): + return backend.numpy.imag(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.imag", "keras.ops.numpy.imag"]) +def imag(x): + """Return the imaginary part of the complex argument. + + Args: + x: Input tensor. + + Returns: + The imaginary component of the complex argument. + """ + if any_symbolic_tensors((x,)): + return Imag().symbolic_call(x) + return backend.numpy.imag(x) + + +class Isclose(Operation): + def call(self, x1, x2, rtol=1e-5, atol=1e-8, equal_nan=False): + return backend.numpy.isclose(x1, x2, rtol, atol, equal_nan) + + def compute_output_spec( + self, x1, x2, rtol=1e-5, atol=1e-8, equal_nan=False + ): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export(["keras.ops.isclose", "keras.ops.numpy.isclose"]) +def isclose(x1, x2, rtol=1e-5, atol=1e-8, equal_nan=False): + """Return whether two tensors are element-wise almost equal. + + Args: + x1: First input tensor. + x2: Second input tensor. + rtol: Relative tolerance. + atol: Absolute tolerance. + equal_nan: If `True`, element-wise NaNs are considered equal. + + Returns: + Output boolean tensor. 
+ """ + if any_symbolic_tensors((x1, x2)): + return Isclose().symbolic_call(x1, x2, rtol, atol, equal_nan) + return backend.numpy.isclose(x1, x2, rtol, atol, equal_nan) + + +class Isfinite(Operation): + def call(self, x): + return backend.numpy.isfinite(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype="bool") + + +@keras_export(["keras.ops.isfinite", "keras.ops.numpy.isfinite"]) +def isfinite(x): + """Return whether a tensor is finite, element-wise. + + Real values are finite when they are not NaN, not positive infinity, and + not negative infinity. Complex values are finite when both their real + and imaginary parts are finite. + + Args: + x: Input tensor. + + Returns: + Output boolean tensor. + """ + if any_symbolic_tensors((x,)): + return Isfinite().symbolic_call(x) + return backend.numpy.isfinite(x) + + +class Isinf(Operation): + def call(self, x): + return backend.numpy.isinf(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype="bool") + + +@keras_export(["keras.ops.isinf", "keras.ops.numpy.isinf"]) +def isinf(x): + """Test element-wise for positive or negative infinity. + + Args: + x: Input tensor. + + Returns: + Output boolean tensor. + """ + if any_symbolic_tensors((x,)): + return Isinf().symbolic_call(x) + return backend.numpy.isinf(x) + + +class Isnan(Operation): + def call(self, x): + return backend.numpy.isnan(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype="bool") + + +@keras_export(["keras.ops.isnan", "keras.ops.numpy.isnan"]) +def isnan(x): + """Test element-wise for NaN and return result as a boolean tensor. + + Args: + x: Input tensor. + + Returns: + Output boolean tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Isnan().symbolic_call(x) + return backend.numpy.isnan(x) + + +class Less(Operation): + def call(self, x1, x2): + return backend.numpy.less(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export(["keras.ops.less", "keras.ops.numpy.less"]) +def less(x1, x2): + """Return the truth value of `x1 < x2` element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise comparison of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Less().symbolic_call(x1, x2) + return backend.numpy.less(x1, x2) + + +class LessEqual(Operation): + def call(self, x1, x2): + return backend.numpy.less_equal(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export( + [ + "keras.ops.less_equal", + "keras.ops.numpy.less_equal", + ] +) +def less_equal(x1, x2): + """Return the truth value of `x1 <= x2` element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise comparison of `x1` and `x2`. 
+ """ + if any_symbolic_tensors((x1, x2)): + return LessEqual().symbolic_call(x1, x2) + return backend.numpy.less_equal(x1, x2) + + +class Linspace(Operation): + def __init__( + self, num=50, endpoint=True, retstep=False, dtype=float, axis=0 + ): + super().__init__() + self.num = num + self.endpoint = endpoint + self.retstep = retstep + self.dtype = dtype + self.axis = axis + + def call(self, start, stop): + return backend.numpy.linspace( + start, + stop, + num=self.num, + endpoint=self.endpoint, + retstep=self.retstep, + dtype=self.dtype, + axis=self.axis, + ) + + def compute_output_spec(self, start, stop): + start_shape = getattr(start, "shape", []) + stop_shape = getattr(stop, "shape", []) + output_shape = broadcast_shapes(start_shape, stop_shape) + if self.axis == -1: + output_shape = output_shape + [self.num] + elif self.axis >= 0: + output_shape = ( + output_shape[: self.axis] + + [self.num] + + output_shape[self.axis :] + ) + else: + output_shape = ( + output_shape[: self.axis + 1] + + [self.num] + + output_shape[self.axis + 1 :] + ) + + dtype = ( + self.dtype + if self.dtype is not None + else getattr(start, "dtype", type(start)) + ) + dtype = backend.result_type(dtype, float) + if self.retstep: + return (KerasTensor(output_shape, dtype=dtype), None) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.linspace", "keras.ops.numpy.linspace"]) +def linspace( + start, stop, num=50, endpoint=True, retstep=False, dtype=None, axis=0 +): + """Return evenly spaced numbers over a specified interval. + + Returns `num` evenly spaced samples, calculated over the interval + `[start, stop]`. + + The endpoint of the interval can optionally be excluded. + + Args: + start: The starting value of the sequence. + stop: The end value of the sequence, unless `endpoint` is set to + `False`. In that case, the sequence consists of all but the last + of `num + 1` evenly spaced samples, so that `stop` is excluded. 
+ Note that the step size changes when `endpoint` is `False`. + num: Number of samples to generate. Defaults to `50`. Must be + non-negative. + endpoint: If `True`, `stop` is the last sample. Otherwise, it is + not included. Defaults to `True`. + retstep: If `True`, return `(samples, step)`, where `step` is the + spacing between samples. + dtype: The type of the output tensor. + axis: The axis in the result to store the samples. Relevant only if + start or stop are array-like. Defaults to `0`. + + Note: + Torch backend does not support `axis` argument. + + Returns: + A tensor of evenly spaced numbers. + If `retstep` is `True`, returns `(samples, step)` + """ + if any_symbolic_tensors((start, stop)): + return Linspace(num, endpoint, retstep, dtype, axis)(start, stop) + return backend.numpy.linspace( + start, + stop, + num=num, + endpoint=endpoint, + retstep=retstep, + dtype=dtype, + axis=axis, + ) + + +class Log(Operation): + def call(self, x): + return backend.numpy.log(x) + + def compute_output_spec(self, x): + dtype = ( + backend.floatx() + if backend.standardize_dtype(x.dtype) == "int64" + else dtypes.result_type(x.dtype, float) + ) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.log", "keras.ops.numpy.log"]) +def log(x): + """Natural logarithm, element-wise. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise natural logarithm of `x`. + """ + if any_symbolic_tensors((x,)): + return Log().symbolic_call(x) + return backend.numpy.log(x) + + +class Log10(Operation): + def call(self, x): + return backend.numpy.log10(x) + + def compute_output_spec(self, x): + dtype = ( + backend.floatx() + if backend.standardize_dtype(x.dtype) == "int64" + else dtypes.result_type(x.dtype, float) + ) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.log10", "keras.ops.numpy.log10"]) +def log10(x): + """Return the base 10 logarithm of the input tensor, element-wise. + + Args: + x: Input tensor. 
+ + Returns: + Output tensor, element-wise base 10 logarithm of `x`. + """ + if any_symbolic_tensors((x,)): + return Log10().symbolic_call(x) + return backend.numpy.log10(x) + + +class Log1p(Operation): + def call(self, x): + return backend.numpy.log1p(x) + + def compute_output_spec(self, x): + dtype = ( + backend.floatx() + if backend.standardize_dtype(x.dtype) == "int64" + else dtypes.result_type(x.dtype, float) + ) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.log1p", "keras.ops.numpy.log1p"]) +def log1p(x): + """Returns the natural logarithm of one plus the `x`, element-wise. + + Calculates `log(1 + x)`. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise natural logarithm of `1 + x`. + """ + if any_symbolic_tensors((x,)): + return Log1p().symbolic_call(x) + return backend.numpy.log1p(x) + + +class Log2(Operation): + def call(self, x): + return backend.numpy.log2(x) + + def compute_output_spec(self, x): + dtype = ( + backend.floatx() + if backend.standardize_dtype(x.dtype) == "int64" + else dtypes.result_type(x.dtype, float) + ) + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.log2", "keras.ops.numpy.log2"]) +def log2(x): + """Base-2 logarithm of `x`, element-wise. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise base-2 logarithm of `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Log2().symbolic_call(x) + return backend.numpy.log2(x) + + +class Logaddexp(Operation): + def call(self, x1, x2): + return backend.numpy.logaddexp(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + float, + ) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.logaddexp", "keras.ops.numpy.logaddexp"]) +def logaddexp(x1, x2): + """Logarithm of the sum of exponentiations of the inputs. + + Calculates `log(exp(x1) + exp(x2))`. + + Args: + x1: Input tensor. + x2: Input tensor. + + Returns: + Output tensor, element-wise logarithm of the sum of exponentiations + of the inputs. + """ + if any_symbolic_tensors((x1, x2)): + return Logaddexp().symbolic_call(x1, x2) + return backend.numpy.logaddexp(x1, x2) + + +class LogicalAnd(Operation): + def call(self, x1, x2): + return backend.numpy.logical_and(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export( + [ + "keras.ops.logical_and", + "keras.ops.numpy.logical_and", + ] +) +def logical_and(x1, x2): + """Computes the element-wise logical AND of the given input tensors. + + Zeros are treated as `False` and non-zeros are treated as `True`. + + Args: + x1: Input tensor. + x2: Input tensor. + + Returns: + Output tensor, element-wise logical AND of the inputs. 
+ """ + if any_symbolic_tensors((x1, x2)): + return LogicalAnd().symbolic_call(x1, x2) + return backend.numpy.logical_and(x1, x2) + + +class LogicalNot(Operation): + def call(self, x): + return backend.numpy.logical_not(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype="bool") + + +@keras_export( + [ + "keras.ops.logical_not", + "keras.ops.numpy.logical_not", + ] +) +def logical_not(x): + """Computes the element-wise NOT of the given input tensor. + + Zeros are treated as `False` and non-zeros are treated as `True`. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise logical NOT of the input. + """ + if any_symbolic_tensors((x,)): + return LogicalNot().symbolic_call(x) + return backend.numpy.logical_not(x) + + +class LogicalOr(Operation): + def call(self, x1, x2): + return backend.numpy.logical_or(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export( + [ + "keras.ops.logical_or", + "keras.ops.numpy.logical_or", + ] +) +def logical_or(x1, x2): + """Computes the element-wise logical OR of the given input tensors. + + Zeros are treated as `False` and non-zeros are treated as `True`. + + Args: + x1: Input tensor. + x2: Input tensor. + + Returns: + Output tensor, element-wise logical OR of the inputs. 
+ """ + if any_symbolic_tensors((x1, x2)): + return LogicalOr().symbolic_call(x1, x2) + return backend.numpy.logical_or(x1, x2) + + +class Logspace(Operation): + def __init__(self, num=50, endpoint=True, base=10, dtype=float, axis=0): + super().__init__() + self.num = num + self.endpoint = endpoint + self.base = base + self.dtype = dtype + self.axis = axis + + def call(self, start, stop): + return backend.numpy.logspace( + start, + stop, + num=self.num, + endpoint=self.endpoint, + base=self.base, + dtype=self.dtype, + axis=self.axis, + ) + + def compute_output_spec(self, start, stop): + start_shape = getattr(start, "shape", []) + stop_shape = getattr(stop, "shape", []) + output_shape = broadcast_shapes(start_shape, stop_shape) + if self.axis == -1: + output_shape = output_shape + [self.num] + elif self.axis >= 0: + output_shape = ( + output_shape[: self.axis] + + [self.num] + + output_shape[self.axis :] + ) + else: + output_shape = ( + output_shape[: self.axis + 1] + + [self.num] + + output_shape[self.axis + 1 :] + ) + dtype = ( + self.dtype + if self.dtype is not None + else getattr(start, "dtype", type(start)) + ) + dtype = backend.result_type(dtype, float) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.logspace", "keras.ops.numpy.logspace"]) +def logspace(start, stop, num=50, endpoint=True, base=10, dtype=None, axis=0): + """Returns numbers spaced evenly on a log scale. + + In linear space, the sequence starts at `base ** start` and ends with + `base ** stop` (see `endpoint` below). + + Args: + start: The starting value of the sequence. + stop: The final value of the sequence, unless `endpoint` is `False`. + In that case, `num + 1` values are spaced over the interval in + log-space, of which all but the last (a sequence of length `num`) + are returned. + num: Number of samples to generate. Defaults to `50`. + endpoint: If `True`, `stop` is the last sample. Otherwise, it is not + included. Defaults to `True`. 
+ base: The base of the log space. Defaults to `10`. + dtype: The type of the output tensor. + axis: The axis in the result to store the samples. Relevant only + if start or stop are array-like. + + Note: + Torch backend does not support `axis` argument. + + Returns: + A tensor of evenly spaced samples on a log scale. + """ + if any_symbolic_tensors((start, stop)): + return Logspace(num, endpoint, base, dtype, axis)(start, stop) + return backend.numpy.logspace( + start, + stop, + num=num, + endpoint=endpoint, + base=base, + dtype=dtype, + axis=axis, + ) + + +class Matmul(Operation): + def call(self, x1, x2): + return backend.numpy.matmul(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = operation_utils.compute_matmul_output_shape( + x1_shape, x2_shape + ) + x1_sparse = getattr(x1, "sparse", True) + x2_sparse = getattr(x2, "sparse", True) + output_sparse = x1_sparse and x2_sparse + x1_dtype = backend.standardize_dtype(getattr(x1, "dtype", type(x1))) + x2_dtype = backend.standardize_dtype(getattr(x2, "dtype", type(x2))) + if x1_dtype == "int8" and x2_dtype == "int8": + dtype = "int32" + else: + dtype = dtypes.result_type(x1_dtype, x2_dtype) + return KerasTensor(output_shape, dtype=dtype, sparse=output_sparse) + + +@keras_export(["keras.ops.matmul", "keras.ops.numpy.matmul"]) +def matmul(x1, x2): + """Matrix product of two tensors. + + - If both tensors are 1-dimensional, the dot product (scalar) is returned. + - If either tensor is N-D, N > 2, it is treated as a stack of matrices + residing in the last two indexes and broadcast accordingly. + - If the first tensor is 1-D, it is promoted to a matrix by prepending + a 1 to its dimensions. After matrix multiplication the prepended + 1 is removed. + - If the second tensor is 1-D, it is promoted to a matrix by appending a 1 + to its dimensions. After matrix multiplication the appended 1 is removed. + + Args: + x1: First tensor. 
+ x2: Second tensor. + + Returns: + Output tensor, matrix product of the inputs. + """ + if any_symbolic_tensors((x1, x2)): + return Matmul().symbolic_call(x1, x2) + return backend.numpy.matmul(x1, x2) + + +class Max(Operation): + def __init__(self, axis=None, keepdims=False, initial=None): + super().__init__() + if isinstance(axis, int): + self.axis = [axis] + else: + self.axis = axis + self.keepdims = keepdims + self.initial = initial + + def call(self, x): + return backend.numpy.max( + x, axis=self.axis, keepdims=self.keepdims, initial=self.initial + ) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=x.dtype, + ) + + +@keras_export(["keras.ops.max", "keras.ops.numpy.max"]) +def max(x, axis=None, keepdims=False, initial=None): + """Return the maximum of a tensor or maximum along an axis. + + Args: + x: Input tensor. + axis: Axis or axes along which to operate. By default, flattened input + is used. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. Defaults to `False`. + initial: The minimum value of an output element. Defaults to `None`. + + Returns: + Maximum of `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Max(axis=axis, keepdims=keepdims, initial=initial).symbolic_call( + x + ) + return backend.numpy.max(x, axis=axis, keepdims=keepdims, initial=initial) + + +class Maximum(Operation): + def call(self, x1, x2): + return backend.numpy.maximum(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and x2_sparse + return KerasTensor( + output_shape, dtype=output_dtype, sparse=output_sparse + ) + + +@keras_export(["keras.ops.maximum", "keras.ops.numpy.maximum"]) +def maximum(x1, x2): + """Element-wise maximum of `x1` and `x2`. + + Args: + x1: First tensor. + x2: Second tensor. + + Returns: + Output tensor, element-wise maximum of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Maximum().symbolic_call(x1, x2) + return backend.numpy.maximum(x1, x2) + + +class Median(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.median(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + output_shape = reduce_shape( + x.shape, axis=self.axis, keepdims=self.keepdims + ) + if backend.standardize_dtype(x.dtype) == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(x.dtype, float) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.median", "keras.ops.numpy.median"]) +def median(x, axis=None, keepdims=False): + """Compute the median along the specified axis. + + Args: + x: Input tensor. 
+ axis: Axis or axes along which the medians are computed. Defaults to + `axis=None` which is to compute the median(s) along a flattened + version of the array. + keepdims: If this is set to `True`, the axes which are reduce + are left in the result as dimensions with size one. + + Returns: + The output tensor. + """ + if any_symbolic_tensors((x,)): + return Median(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.median(x, axis=axis, keepdims=keepdims) + + +class Meshgrid(Operation): + def __init__(self, indexing="xy"): + super().__init__() + if indexing not in ("xy", "ij"): + raise ValueError( + "Valid values for `indexing` are 'xy' and 'ij', " + "but received {index}." + ) + self.indexing = indexing + + def call(self, *x): + return backend.numpy.meshgrid(*x, indexing=self.indexing) + + def compute_output_spec(self, *x): + output_shape = [] + for xi in x: + if len(xi.shape) == 0: + size = 1 + else: + if None in xi.shape: + size = None + else: + size = int(np.prod(xi.shape)) + output_shape.append(size) + if self.indexing == "ij": + return [KerasTensor(output_shape) for _ in range(len(x))] + tmp = output_shape[0] + output_shape[0] = output_shape[1] + output_shape[1] = tmp + return [ + KerasTensor(output_shape, dtype=xi.dtype) for _ in range(len(x)) + ] + + +@keras_export(["keras.ops.meshgrid", "keras.ops.numpy.meshgrid"]) +def meshgrid(*x, indexing="xy"): + """Creates grids of coordinates from coordinate vectors. + + Given `N` 1-D tensors `T0, T1, ..., TN-1` as inputs with corresponding + lengths `S0, S1, ..., SN-1`, this creates an `N` N-dimensional tensors + `G0, G1, ..., GN-1` each with shape `(S0, ..., SN-1)` where the output + `Gi` is constructed by expanding `Ti` to the result shape. + + Args: + x: 1-D tensors representing the coordinates of a grid. + indexing: `"xy"` or `"ij"`. "xy" is cartesian; `"ij"` is matrix + indexing of output. Defaults to `"xy"`. + + Returns: + Sequence of N tensors. 
+ + Example: + >>> from keras.src import ops + >>> x = ops.array([1, 2, 3]) + >>> y = ops.array([4, 5, 6]) + + >>> grid_x, grid_y = ops.meshgrid(x, y, indexing="ij") + >>> grid_x + array([[1, 1, 1], + [2, 2, 2], + [3, 3, 3]]) + >>> grid_y + array([[4, 5, 6], + [4, 5, 6], + [4, 5, 6]]) + """ + if any_symbolic_tensors(x): + return Meshgrid(indexing=indexing).symbolic_call(*x) + return backend.numpy.meshgrid(*x, indexing=indexing) + + +class Min(Operation): + def __init__(self, axis=None, keepdims=False, initial=None): + super().__init__() + if isinstance(axis, int): + self.axis = [axis] + else: + self.axis = axis + self.keepdims = keepdims + self.initial = initial + + def call(self, x): + return backend.numpy.min( + x, axis=self.axis, keepdims=self.keepdims, initial=self.initial + ) + + def compute_output_spec(self, x): + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=x.dtype, + ) + + +@keras_export(["keras.ops.min", "keras.ops.numpy.min"]) +def min(x, axis=None, keepdims=False, initial=None): + """Return the minimum of a tensor or minimum along an axis. + + Args: + x: Input tensor. + axis: Axis or axes along which to operate. By default, flattened input + is used. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. Defaults to `False`. + initial: The maximum value of an output element. Defaults to `None`. + + Returns: + Minimum of `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Min(axis=axis, keepdims=keepdims, initial=initial).symbolic_call( + x + ) + return backend.numpy.min(x, axis=axis, keepdims=keepdims, initial=initial) + + +class Minimum(Operation): + def call(self, x1, x2): + return backend.numpy.minimum(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and x2_sparse + return KerasTensor( + output_shape, dtype=output_dtype, sparse=output_sparse + ) + + +@keras_export(["keras.ops.minimum", "keras.ops.numpy.minimum"]) +def minimum(x1, x2): + """Element-wise minimum of `x1` and `x2`. + + Args: + x1: First tensor. + x2: Second tensor. + + Returns: + Output tensor, element-wise minimum of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Minimum().symbolic_call(x1, x2) + return backend.numpy.minimum(x1, x2) + + +class Mod(Operation): + def call(self, x1, x2): + return backend.numpy.mod(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + if output_dtype == "bool": + output_dtype = "int32" + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.mod", "keras.ops.numpy.mod"]) +def mod(x1, x2): + """Returns the element-wise remainder of division. + + Args: + x1: First tensor. + x2: Second tensor. + + Returns: + Output tensor, element-wise remainder of division. 
+ """ + if any_symbolic_tensors((x1, x2)): + return Mod().symbolic_call(x1, x2) + return backend.numpy.mod(x1, x2) + + +class Moveaxis(Operation): + def __init__(self, source, destination): + super().__init__() + if isinstance(source, int): + self.source = [source] + else: + self.source = source + if isinstance(destination, int): + self.destination = [destination] + else: + self.destination = destination + + if len(self.source) != len(self.destination): + raise ValueError( + "`source` and `destination` arguments must have the same " + f"number of elements, but received `source={source}` and " + f"`destination={destination}`." + ) + + def call(self, x): + return backend.numpy.moveaxis(x, self.source, self.destination) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + output_shape = [-1 for _ in range(len(x.shape))] + for sc, dst in zip(self.source, self.destination): + output_shape[dst] = x_shape[sc] + x_shape[sc] = -1 + i, j = 0, 0 + while i < len(output_shape): + while i < len(output_shape) and output_shape[i] != -1: + # Find the first dim unset. + i += 1 + while j < len(output_shape) and x_shape[j] == -1: + # Find the first dim not being passed. + j += 1 + if i == len(output_shape): + break + output_shape[i] = x_shape[j] + i += 1 + j += 1 + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.moveaxis", "keras.ops.numpy.moveaxis"]) +def moveaxis(x, source, destination): + """Move axes of a tensor to new positions. + + Other axes remain in their original order. + + Args: + x: Tensor whose axes should be reordered. + source: Original positions of the axes to move. These must be unique. + destination: Destinations positions for each of the original axes. + These must also be unique. + + Returns: + Tensor with moved axes. 
+ """ + if any_symbolic_tensors((x,)): + return Moveaxis(source, destination).symbolic_call(x) + return backend.numpy.moveaxis(x, source=source, destination=destination) + + +class NanToNum(Operation): + def __init__(self, nan=0.0, posinf=None, neginf=None): + super().__init__() + self.nan = nan + self.posinf = posinf + self.neginf = neginf + + def call(self, x): + return backend.numpy.nan_to_num( + x, nan=self.nan, posinf=self.posinf, neginf=self.neginf + ) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.nan_to_num", + "keras.ops.numpy.nan_to_num", + ] +) +def nan_to_num(x, nan=0.0, posinf=None, neginf=None): + """Replace NaN with zero and infinity with large finite numbers. + + Args: + x: Input data. + nan: Optional float or int. Value to replace `NaN` entries with. + posinf: Optional float or int. + Value to replace positive infinity with. + neginf: Optional float or int. + Value to replace negative infinity with. + + Returns: + `x`, with non-finite values replaced. + """ + if any_symbolic_tensors((x,)): + return NanToNum(nan=nan, posinf=posinf, neginf=neginf).symbolic_call(x) + return backend.numpy.nan_to_num(x, nan=nan, posinf=posinf, neginf=neginf) + + +class Ndim(Operation): + def call(self, x): + return backend.numpy.ndim( + x, + ) + + def compute_output_spec(self, x): + return KerasTensor([len(x.shape)]) + + +@keras_export(["keras.ops.ndim", "keras.ops.numpy.ndim"]) +def ndim(x): + """Return the number of dimensions of a tensor. + + Args: + x: Input tensor. + + Returns: + The number of dimensions in `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Ndim().symbolic_call(x) + return backend.numpy.ndim(x) + + +class Nonzero(Operation): + def call(self, x): + return backend.numpy.nonzero(x) + + def compute_output_spec(self, x): + return tuple( + [KerasTensor((None,), dtype="int32") for _ in range(len(x.shape))] + ) + + +@keras_export(["keras.ops.nonzero", "keras.ops.numpy.nonzero"]) +def nonzero(x): + """Return the indices of the elements that are non-zero. + + Args: + x: Input tensor. + + Returns: + Indices of elements that are non-zero. + """ + if any_symbolic_tensors((x,)): + return Nonzero().symbolic_call(x) + return backend.numpy.nonzero(x) + + +class NotEqual(Operation): + def call(self, x1, x2): + return backend.numpy.not_equal(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export(["keras.ops.not_equal", "keras.ops.numpy.not_equal"]) +def not_equal(x1, x2): + """Return `(x1 != x2)` element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise comparison of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return NotEqual().symbolic_call(x1, x2) + return backend.numpy.not_equal(x1, x2) + + +class OnesLike(Operation): + def call(self, x, dtype=None): + return backend.numpy.ones_like(x, dtype=dtype) + + def compute_output_spec(self, x, dtype=None): + if dtype is None: + dtype = x.dtype + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export(["keras.ops.ones_like", "keras.ops.numpy.ones_like"]) +def ones_like(x, dtype=None): + """Return a tensor of ones with the same shape and type of `x`. + + Args: + x: Input tensor. + dtype: Overrides the data type of the result. + + Returns: + A tensor of ones with the same shape and type as `x`. 
+ """ + if any_symbolic_tensors((x,)): + return OnesLike().symbolic_call(x, dtype=dtype) + return backend.numpy.ones_like(x, dtype=dtype) + + +class ZerosLike(Operation): + def call(self, x, dtype=None): + return backend.numpy.zeros_like(x, dtype=dtype) + + def compute_output_spec(self, x, dtype=None): + if dtype is None: + dtype = x.dtype + return KerasTensor(x.shape, dtype=dtype) + + +@keras_export( + [ + "keras.ops.zeros_like", + "keras.ops.numpy.zeros_like", + ] +) +def zeros_like(x, dtype=None): + """Return a tensor of zeros with the same shape and type as `x`. + + Args: + x: Input tensor. + dtype: Overrides the data type of the result. + + Returns: + A tensor of zeros with the same shape and type as `x`. + """ + if any_symbolic_tensors((x,)): + return ZerosLike().symbolic_call(x, dtype=dtype) + return backend.numpy.zeros_like(x, dtype=dtype) + + +class Outer(Operation): + def call(self, x1, x2): + return backend.numpy.outer(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", [1]) + x2_shape = getattr(x2, "shape", [1]) + if None in x1_shape: + x1_flatten_shape = None + else: + x1_flatten_shape = int(np.prod(x1_shape)) + if None in x2_shape: + x2_flatten_shape = None + else: + x2_flatten_shape = int(np.prod(x2_shape)) + output_shape = [x1_flatten_shape, x2_flatten_shape] + output_dtype = backend.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.outer", "keras.ops.numpy.outer"]) +def outer(x1, x2): + """Compute the outer product of two vectors. + + Given two vectors `x1` and `x2`, the outer product is: + + ``` + out[i, j] = x1[i] * x2[j] + ``` + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Outer product of `x1` and `x2`. 
+ """ + if any_symbolic_tensors((x1, x2)): + return Outer().symbolic_call(x1, x2) + return backend.numpy.outer(x1, x2) + + +class Pad(Operation): + def __init__(self, pad_width, mode="constant"): + super().__init__() + self.pad_width = self._process_pad_width(pad_width) + self.mode = mode + + def _process_pad_width(self, pad_width): + if isinstance(pad_width, int): + return ((pad_width, pad_width),) + if isinstance(pad_width, (tuple, list)) and isinstance( + pad_width[0], int + ): + return (pad_width,) + first_len = len(pad_width[0]) + for i, pw in enumerate(pad_width): + if len(pw) != first_len: + raise ValueError( + "`pad_width` should be a list of tuples of length " + f"1 or 2. Received: pad_width={pad_width}" + ) + if len(pw) == 1: + pad_width[i] = (pw[0], pw[0]) + return pad_width + + def call(self, x, constant_values=None): + if len(self.pad_width) > 1 and len(self.pad_width) != len(x.shape): + raise ValueError( + "`pad_width` must have the same length as `x.shape`. " + f"Received: pad_width={self.pad_width} " + f"(of length {len(self.pad_width)}) and x.shape={x.shape} " + f"(of length {len(x.shape)})" + ) + return backend.numpy.pad( + x, + pad_width=self.pad_width, + mode=self.mode, + constant_values=constant_values, + ) + + def compute_output_spec(self, x, constant_values=None): + output_shape = list(x.shape) + if len(self.pad_width) == 1: + pad_width = [self.pad_width[0] for _ in range(len(output_shape))] + elif len(self.pad_width) == len(output_shape): + pad_width = self.pad_width + else: + raise ValueError( + "`pad_width` must have the same length as `x.shape`. 
" + f"Received: pad_width={self.pad_width} " + f"(of length {len(self.pad_width)}) and x.shape={x.shape} " + f"(of length {len(x.shape)})" + ) + + for i in range(len(output_shape)): + if output_shape[i] is None: + output_shape[i] = None + else: + output_shape[i] += pad_width[i][0] + pad_width[i][1] + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.pad", "keras.ops.numpy.pad"]) +def pad(x, pad_width, mode="constant", constant_values=None): + """Pad a tensor. + + Args: + x: Tensor to pad. + pad_width: Number of values padded to the edges of each axis. + `((before_1, after_1), ...(before_N, after_N))` unique pad + widths for each axis. + `((before, after),)` yields same before and after pad for + each axis. + `(pad,)` or `int` is a shortcut for `before = after = pad` + width for all axes. + mode: One of `"constant"`, `"edge"`, `"linear_ramp"`, + `"maximum"`, `"mean"`, `"median"`, `"minimum"`, + `"reflect"`, `"symmetric"`, `"wrap"`, `"empty"`, + `"circular"`. Defaults to `"constant"`. + constant_values: value to pad with if `mode == "constant"`. + Defaults to `0`. A `ValueError` is raised if not None and + `mode != "constant"`. + + Note: + Torch backend only supports modes `"constant"`, `"reflect"`, + `"symmetric"` and `"circular"`. + Only Torch backend supports `"circular"` mode. + + Note: + Tensorflow backend only supports modes `"constant"`, `"reflect"` + and `"symmetric"`. + + Returns: + Padded tensor. 
+ """ + return Pad(pad_width, mode=mode)(x, constant_values=constant_values) + + +class Prod(Operation): + def __init__(self, axis=None, keepdims=False, dtype=None): + super().__init__() + if isinstance(axis, int): + self.axis = [axis] + else: + self.axis = axis + self.keepdims = keepdims + self.dtype = dtype + + def call(self, x): + return backend.numpy.prod( + x, + axis=self.axis, + keepdims=self.keepdims, + dtype=self.dtype, + ) + + def compute_output_spec(self, x): + if self.dtype is not None: + dtype = self.dtype + else: + dtype = backend.result_type(x.dtype) + if dtype == "bool": + dtype = "int32" + elif dtype in ("int8", "int16"): + dtype = "int32" + elif dtype in ("uint8", "uint16"): + dtype = "uint32" + # TODO: torch doesn't support uint32 + if backend.backend() == "torch" and dtype == "uint32": + dtype = "int32" + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=dtype, + ) + + +@keras_export(["keras.ops.prod", "keras.ops.numpy.prod"]) +def prod(x, axis=None, keepdims=False, dtype=None): + """Return the product of tensor elements over a given axis. + + Args: + x: Input tensor. + axis: Axis or axes along which a product is performed. The default, + `axis=None`, will compute the product of all elements + in the input tensor. + keepdims: If this is set to `True`, the axes which are reduce + are left in the result as dimensions with size one. + dtype: Data type of the returned tensor. + + Returns: + Product of elements of `x` over the given axis or axes. 
+ """ + if any_symbolic_tensors((x,)): + return Prod(axis=axis, keepdims=keepdims, dtype=dtype).symbolic_call(x) + return backend.numpy.prod(x, axis=axis, keepdims=keepdims, dtype=dtype) + + +class Quantile(Operation): + def __init__(self, axis=None, method="linear", keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.method = method + self.keepdims = keepdims + + def call(self, x, q): + return backend.numpy.quantile( + x, q, axis=self.axis, keepdims=self.keepdims + ) + + def compute_output_spec(self, x, q): + output_shape = reduce_shape( + x.shape, axis=self.axis, keepdims=self.keepdims + ) + if hasattr(q, "shape"): + if len(q.shape) > 0: + output_shape = (q.shape[0],) + output_shape + if backend.standardize_dtype(x.dtype) == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(x.dtype, float) + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.quantile", "keras.ops.numpy.quantile"]) +def quantile(x, q, axis=None, method="linear", keepdims=False): + """Compute the q-th quantile(s) of the data along the specified axis. + + Args: + x: Input tensor. + q: Probability or sequence of probabilities for the quantiles to + compute. Values must be between 0 and 1 inclusive. + axis: Axis or axes along which the quantiles are computed. Defaults to + `axis=None` which is to compute the quantile(s) along a flattened + version of the array. + method: A string specifies the method to use for estimating the + quantile. Available methods are `"linear"`, `"lower"`, `"higher"`, + `"midpoint"`, and `"nearest"`. Defaults to `"linear"`. + If the desired quantile lies between two data points `i < j`: + - `"linear"`: `i + (j - i) * fraction`, where fraction is the + fractional part of the index surrounded by `i` and `j`. + - `"lower"`: `i`. + - `"higher"`: `j`. + - `"midpoint"`: `(i + j) / 2` + - `"nearest"`: `i` or `j`, whichever is nearest. 
+ keepdims: If this is set to `True`, the axes which are reduce + are left in the result as dimensions with size one. + + Returns: + The quantile(s). If `q` is a single probability and `axis=None`, then + the result is a scalar. If multiple probabilities levels are given, + first axis of the result corresponds to the quantiles. The other axes + are the axes that remain after the reduction of `x`. + """ + if any_symbolic_tensors((x, q)): + return Quantile( + axis=axis, method=method, keepdims=keepdims + ).symbolic_call(x, q) + return backend.numpy.quantile( + x, q, axis=axis, method=method, keepdims=keepdims + ) + + +class Ravel(Operation): + def call(self, x): + return backend.numpy.ravel(x) + + def compute_output_spec(self, x): + if None in x.shape: + output_shape = [ + None, + ] + else: + output_shape = [int(np.prod(x.shape))] + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.ravel", "keras.ops.numpy.ravel"]) +def ravel(x): + """Return a contiguous flattened tensor. + + A 1-D tensor, containing the elements of the input, is returned. + + Args: + x: Input tensor. + + Returns: + Output tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Ravel().symbolic_call(x) + return backend.numpy.ravel(x) + + +class UnravelIndex(Operation): + def __init__(self, shape): + self.shape = shape + self._inbound_nodes = [] + + def call(self, indices): + return backend.numpy.unravel_index(indices, self.shape) + + def compute_output_spec(self, indices): + if None in self.shape: + output_shapes = [[None] for _ in self.shape] + else: + if isinstance(indices, int): + output_shapes = [[1] for _ in self.shape] + elif hasattr(indices, "shape"): + output_shapes = [list(indices.shape) for _ in self.shape] + else: + try: + indices_shape = np.shape(indices) + output_shapes = [list(indices_shape) for _ in self.shape] + except Exception: + output_shapes = [[None] for _ in self.shape] + + return [ + KerasTensor(shape, dtype=indices.dtype) for shape in output_shapes + ] + + +@keras_export(["keras.ops.unravel_index", "keras.ops.numpy.unravel_index"]) +def unravel_index(indices, shape): + """Convert flat indices to coordinate arrays in a given array shape. + + Args: + indices: An integer or array of integers representing flat indices. + shape: The shape of the array to unravel into. + + Returns: + Tuple of arrays for each dimension with unraveled indices. + + Example: + >>> indices = 5 + >>> shape = (3, 3) + >>> unravel_index(indices, shape) + (1, 2) # 5 is at row 1, column 2 in a 3x3 array + """ + if any_symbolic_tensors((indices,)): + return UnravelIndex(shape).symbolic_call(indices) + + return backend.numpy.unravel_index(indices, shape) + + +class Real(Operation): + def call(self, x): + return backend.numpy.real(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.real", "keras.ops.numpy.real"]) +def real(x): + """Return the real part of the complex argument. + + Args: + x: Input tensor. + + Returns: + The real component of the complex argument. 
+ """ + if any_symbolic_tensors((x,)): + return Real().symbolic_call(x) + return backend.numpy.real(x) + + +class Reciprocal(Operation): + def call(self, x): + return backend.numpy.reciprocal(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape) + + +@keras_export( + [ + "keras.ops.reciprocal", + "keras.ops.numpy.reciprocal", + ] +) +def reciprocal(x): + """Return the reciprocal of the argument, element-wise. + + Calculates `1/x`. + + Args: + x: Input tensor. + + Returns: + Output tensor, element-wise reciprocal of `x`. + """ + if any_symbolic_tensors((x,)): + return Reciprocal().symbolic_call(x) + return backend.numpy.reciprocal(x) + + +class Repeat(Operation): + def __init__(self, repeats, axis=None): + super().__init__() + self.axis = axis + self.repeats = repeats + + def call(self, x): + return backend.numpy.repeat(x, self.repeats, axis=self.axis) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + repeats = self.repeats + if isinstance(repeats, int): + repeats = [repeats] + repeats_size = len(repeats) + broadcast = repeats_size == 1 + + if self.axis is None: + if None in x_shape: + return KerasTensor([None], dtype=x.dtype) + + x_flatten_size = int(np.prod(x_shape)) + if broadcast: + output_shape = [x_flatten_size * repeats[0]] + elif repeats_size != x_flatten_size: + raise ValueError( + "Size of `repeats` and " + "dimensions of `x` after flattening should be compatible. " + f"Received: {repeats_size} and {x_flatten_size}" + ) + else: + output_shape = [int(np.sum(repeats))] + return KerasTensor(output_shape, dtype=x.dtype) + + size_on_ax = x_shape[self.axis] + if size_on_ax is None: + return KerasTensor(x_shape, dtype=x.dtype) + + output_shape = x_shape + if broadcast: + output_shape[self.axis] = size_on_ax * repeats[0] + elif size_on_ax != repeats_size: + raise ValueError( + "Size of `repeats` and " + f"dimensions of `axis {self.axis} of x` should be compatible. 
" + f"Received: {repeats_size} and {x_shape}" + ) + else: + output_shape[self.axis] = int(np.sum(repeats)) + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.repeat", "keras.ops.numpy.repeat"]) +def repeat(x, repeats, axis=None): + """Repeat each element of a tensor after themselves. + + Args: + x: Input tensor. + repeats: The number of repetitions for each element. + axis: The axis along which to repeat values. By default, use + the flattened input array, and return a flat output array. + + Returns: + Output tensor. + """ + if any_symbolic_tensors((x,)): + return Repeat(repeats, axis=axis).symbolic_call(x) + return backend.numpy.repeat(x, repeats, axis=axis) + + +class Reshape(Operation): + def __init__(self, newshape): + super().__init__() + self.newshape = newshape + + def call(self, x): + return backend.numpy.reshape(x, self.newshape) + + def compute_output_spec(self, x): + output_shape = operation_utils.compute_reshape_output_shape( + x.shape, self.newshape, "newshape" + ) + sparse = getattr(x, "sparse", False) + return KerasTensor(output_shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.reshape", "keras.ops.numpy.reshape"]) +def reshape(x, newshape): + """Gives a new shape to a tensor without changing its data. + + Args: + x: Input tensor. + newshape: The new shape should be compatible with the original shape. + One shape dimension can be -1 in which case the value is + inferred from the length of the array and remaining dimensions. + + Returns: + The reshaped tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Reshape(newshape).symbolic_call(x) + return backend.numpy.reshape(x, newshape) + + +class Roll(Operation): + def __init__(self, shift, axis=None): + super().__init__() + self.shift = shift + self.axis = axis + + def call(self, x): + return backend.numpy.roll(x, self.shift, self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.roll", "keras.ops.numpy.roll"]) +def roll(x, shift, axis=None): + """Roll tensor elements along a given axis. + + Elements that roll beyond the last position are re-introduced at the first. + + Args: + x: Input tensor. + shift: The number of places by which elements are shifted. + axis: The axis along which elements are shifted. By default, the + array is flattened before shifting, after which the original + shape is restored. + + Returns: + Output tensor. + """ + if any_symbolic_tensors((x,)): + return Roll(shift, axis=axis).symbolic_call(x) + return backend.numpy.roll(x, shift, axis=axis) + + +class Round(Operation): + def __init__(self, decimals=0): + super().__init__() + self.decimals = decimals + + def call(self, x): + return backend.numpy.round(x, self.decimals) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.round", "keras.ops.numpy.round"]) +def round(x, decimals=0): + """Evenly round to the given number of decimals. + + Args: + x: Input tensor. + decimals: Number of decimal places to round to. Defaults to `0`. + + Returns: + Output tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Round(decimals).symbolic_call(x) + return backend.numpy.round(x, decimals) + + +class SearchSorted(Operation): + def call(self, sorted_sequence, values, side="left"): + sorted_sequence = backend.convert_to_tensor(sorted_sequence) + values = backend.convert_to_tensor(values) + return backend.numpy.searchsorted(sorted_sequence, values, side=side) + + def compute_output_spec(self, sorted_sequence, values, side="left"): + if len(sorted_sequence.shape) != 1: + raise ValueError( + "searchsorted only supports 1-D sorted sequences. Use" + "keras.ops.vectorized_map to extend to N-D sequences." + ) + out_type = ( + "int32" + if sorted_sequence.shape[0] <= np.iinfo(np.int32).max + else "int64" + ) + return KerasTensor(values.shape, dtype=out_type) + + +@keras_export(["keras.ops.searchsorted"]) +def searchsorted(sorted_sequence, values, side="left"): + """Perform a binary search, returning indices for insertion of `values` + into `sorted_sequence` that maintain the sorting order. + + Args: + sorted_sequence: 1-D input tensor, sorted along the innermost + dimension. + values: N-D tensor of query insertion values. + side: 'left' or 'right', specifying the direction in which to insert + for the equality case (tie-breaker). + + Returns: + Tensor of insertion indices of same shape as `values`. 
+ """ + if any_symbolic_tensors((sorted_sequence, values)): + return SearchSorted().symbolic_call(sorted_sequence, values, side=side) + + sorted_sequence = backend.convert_to_tensor(sorted_sequence) + values = backend.convert_to_tensor(values) + return backend.numpy.searchsorted(sorted_sequence, values, side=side) + + +class Sign(Operation): + def call(self, x): + return backend.numpy.sign(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.sign", "keras.ops.numpy.sign"]) +def sign(x): + """Returns a tensor with the signs of the elements of `x`. + + Args: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. + """ + if any_symbolic_tensors((x,)): + return Sign().symbolic_call(x) + return backend.numpy.sign(x) + + +class Sin(Operation): + def call(self, x): + return backend.numpy.sin(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.sin", "keras.ops.numpy.sin"]) +def sin(x): + """Trigonometric sine, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Sin().symbolic_call(x) + return backend.numpy.sin(x) + + +class Sinh(Operation): + def call(self, x): + return backend.numpy.sinh(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.sinh", "keras.ops.numpy.sinh"]) +def sinh(x): + """Hyperbolic sine, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. + """ + if any_symbolic_tensors((x,)): + return Sinh().symbolic_call(x) + return backend.numpy.sinh(x) + + +class Size(Operation): + def call(self, x): + return backend.numpy.size(x) + + def compute_output_spec(self, x): + return KerasTensor([], dtype="int32") + + +@keras_export(["keras.ops.size", "keras.ops.numpy.size"]) +def size(x): + """Return the number of elements in a tensor. + + Args: + x: Input tensor. + + Returns: + Number of elements in `x`. + """ + if any_symbolic_tensors((x,)): + return Size().symbolic_call(x) + return backend.numpy.size(x) + + +class Sort(Operation): + def __init__(self, axis=-1): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.numpy.sort(x, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, x.dtype) + + +@keras_export(["keras.ops.sort", "keras.ops.numpy.sort"]) +def sort(x, axis=-1): + """Sorts the elements of `x` along a given axis in ascending order. + + Args: + x: Input tensor. + axis: Axis along which to sort. If `None`, the tensor is flattened + before sorting. Defaults to `-1`; the last axis. + + Returns: + Sorted tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Sort(axis=axis).symbolic_call(x) + return backend.numpy.sort(x, axis=axis) + + +class Split(Operation): + def __init__(self, indices_or_sections, axis=0): + super().__init__() + if not isinstance(indices_or_sections, int): + indices_or_sections = tuple(indices_or_sections) + self.indices_or_sections = indices_or_sections + self.axis = axis + + def call(self, x): + return backend.numpy.split(x, self.indices_or_sections, axis=self.axis) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + x_size_on_axis = x_shape[self.axis] + if isinstance(self.indices_or_sections, int): + if x_size_on_axis is None: + x_shape[self.axis] = None + return [ + KerasTensor(x_shape, dtype=x.dtype) + for _ in range(self.indices_or_sections) + ] + if np.mod(x_size_on_axis, self.indices_or_sections) != 0: + raise ValueError( + "`x` size on given `axis` must be dividible by " + "`indices_or_sections` when `indices_or_sections` is an " + f"int. But received {x_size_on_axis} and " + f"{self.indices_or_sections}." + ) + size = x_size_on_axis // self.indices_or_sections + x_shape[self.axis] = size + return [ + KerasTensor(x_shape, dtype=x.dtype) + for _ in range(self.indices_or_sections) + ] + + indices_or_sections = (0, *self.indices_or_sections, x_size_on_axis) + output_size = np.diff(indices_or_sections) + outputs = [] + for i in range(len(output_size)): + output_shape = list(x_shape) + output_shape[self.axis] = int(output_size[i]) + outputs.append(KerasTensor(output_shape, dtype=x.dtype)) + return outputs + + +@keras_export(["keras.ops.split", "keras.ops.numpy.split"]) +def split(x, indices_or_sections, axis=0): + """Split a tensor into chunks. + + Args: + x: Input tensor. + indices_or_sections: If an integer, N, the tensor will be split into N + equal sections along `axis`. If a 1-D array of sorted integers, + the entries indicate indices at which the tensor will be split + along `axis`. + axis: Axis along which to split. 
Defaults to `0`. + + Note: + A split does not have to result in equal division when using + Torch backend. + + Returns: + A list of tensors. + """ + if any_symbolic_tensors((x,)): + return Split(indices_or_sections, axis=axis).symbolic_call(x) + return backend.numpy.split(x, indices_or_sections, axis=axis) + + +class Stack(Operation): + def __init__(self, axis=0): + super().__init__() + self.axis = axis + + def call(self, xs): + return backend.numpy.stack(xs, axis=self.axis) + + def compute_output_spec(self, xs): + first_shape = xs[0].shape + dtypes_to_resolve = [] + for x in xs: + if not shape_equal(x.shape, first_shape, axis=[], allow_none=True): + raise ValueError( + "Every value in `xs` must have the same shape. But found " + f"element of shape {x.shape}, which is different from the " + f"first element's shape {first_shape}." + ) + dtypes_to_resolve.append(getattr(x, "dtype", type(x))) + + size_on_axis = len(xs) + output_shape = list(first_shape) + if self.axis == -1: + output_shape = output_shape + [size_on_axis] + elif self.axis >= 0: + output_shape.insert(self.axis, size_on_axis) + else: + output_shape.insert(self.axis + 1, size_on_axis) + output_dtype = dtypes.result_type(*dtypes_to_resolve) + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.stack", "keras.ops.numpy.stack"]) +def stack(x, axis=0): + """Join a sequence of tensors along a new axis. + + The `axis` parameter specifies the index of the new axis in the + dimensions of the result. + + Args: + x: A sequence of tensors. + axis: Axis along which to stack. Defaults to `0`. + + Returns: + The stacked tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Stack(axis=axis).symbolic_call(x) + return backend.numpy.stack(x, axis=axis) + + +class Std(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + self.axis = [axis] + else: + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.std(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + output_dtype = backend.standardize_dtype(x.dtype) + if "int" in output_dtype or output_dtype == "bool": + output_dtype = backend.floatx() + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=output_dtype, + ) + + +@keras_export(["keras.ops.std", "keras.ops.numpy.std"]) +def std(x, axis=None, keepdims=False): + """Compute the standard deviation along the specified axis. + + Args: + x: Input tensor. + axis: Axis along which to compute standard deviation. + Default is to compute the standard deviation of the + flattened tensor. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. + + Returns: + Output tensor containing the standard deviation values. + """ + if any_symbolic_tensors((x,)): + return Std(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.std(x, axis=axis, keepdims=keepdims) + + +class Swapaxes(Operation): + def __init__(self, axis1, axis2): + super().__init__() + + self.axis1 = axis1 + self.axis2 = axis2 + + def call(self, x): + return backend.numpy.swapaxes(x, self.axis1, self.axis2) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + tmp = x_shape[self.axis1] + x_shape[self.axis1] = x_shape[self.axis2] + x_shape[self.axis2] = tmp + return KerasTensor(x_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.swapaxes", "keras.ops.numpy.swapaxes"]) +def swapaxes(x, axis1, axis2): + """Interchange two axes of a tensor. + + Args: + x: Input tensor. + axis1: First axis. 
+ axis2: Second axis. + + Returns: + A tensor with the axes swapped. + """ + if any_symbolic_tensors((x,)): + return Swapaxes(axis1, axis2).symbolic_call(x) + return backend.numpy.swapaxes(x, axis1=axis1, axis2=axis2) + + +class Take(Operation): + def __init__(self, axis=None): + super().__init__() + self.axis = axis + + def call(self, x, indices): + return backend.numpy.take(x, indices, axis=self.axis) + + def compute_output_spec(self, x, indices): + x_shape = list(x.shape) + if isinstance(indices, KerasTensor): + indices_shape = list(indices.shape) + else: + indices_shape = list(getattr(np.array(indices), "shape", [])) + if self.axis is None: + return KerasTensor(indices_shape, dtype=x.dtype) + + # make sure axis is non-negative + axis = len(x_shape) + self.axis if self.axis < 0 else self.axis + output_shape = x_shape[:axis] + indices_shape + x_shape[axis + 1 :] + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.take", "keras.ops.numpy.take"]) +def take(x, indices, axis=None): + """Take elements from a tensor along an axis. + + Args: + x: Source tensor. + indices: The indices of the values to extract. + axis: The axis over which to select values. By default, the + flattened input tensor is used. + + Returns: + The corresponding tensor of values. 
+ """ + if any_symbolic_tensors((x, indices)): + return Take(axis=axis).symbolic_call(x, indices) + return backend.numpy.take(x, indices, axis=axis) + + +class TakeAlongAxis(Operation): + def __init__(self, axis=None): + super().__init__() + self.axis = axis + + def call(self, x, indices): + return backend.numpy.take_along_axis(x, indices, axis=self.axis) + + def compute_output_spec(self, x, indices): + output_shape = operation_utils.compute_take_along_axis_output_shape( + x.shape, indices.shape, self.axis + ) + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export( + [ + "keras.ops.take_along_axis", + "keras.ops.numpy.take_along_axis", + ] +) +def take_along_axis(x, indices, axis=None): + """Select values from `x` at the 1-D `indices` along the given axis. + + Args: + x: Source tensor. + indices: The indices of the values to extract. + axis: The axis over which to select values. By default, the flattened + input tensor is used. + + Returns: + The corresponding tensor of values. + """ + if any_symbolic_tensors((x, indices)): + return TakeAlongAxis(axis=axis).symbolic_call(x, indices) + return backend.numpy.take_along_axis(x, indices, axis=axis) + + +class Tan(Operation): + def call(self, x): + return backend.numpy.tan(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.tan", "keras.ops.numpy.tan"]) +def tan(x): + """Compute tangent, element-wise. + + Args: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Tan().symbolic_call(x) + return backend.numpy.tan(x) + + +class Tanh(Operation): + def call(self, x): + return backend.numpy.tanh(x) + + def compute_output_spec(self, x): + dtype = backend.standardize_dtype(getattr(x, "dtype", backend.floatx())) + if dtype == "int64": + dtype = backend.floatx() + else: + dtype = dtypes.result_type(dtype, float) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.tanh", "keras.ops.numpy.tanh"]) +def tanh(x): + """Hyperbolic tangent, element-wise. + + Arguments: + x: Input tensor. + + Returns: + Output tensor of same shape as `x`. + """ + if any_symbolic_tensors((x,)): + return Tanh().symbolic_call(x) + return backend.numpy.tanh(x) + + +class Tensordot(Operation): + def __init__(self, axes=2): + super().__init__() + self.axes = axes + + def call(self, x1, x2): + return backend.numpy.tensordot(x1, x2, axes=self.axes) + + def compute_output_spec(self, x1, x2): + x1_shape = list(getattr(x1, "shape", [])) + x2_shape = list(getattr(x2, "shape", [])) + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + if not isinstance(self.axes, int): + x1_select_shape = [x1_shape[ax] for ax in self.axes[0]] + x2_select_shape = [x2_shape[ax] for ax in self.axes[1]] + if not shape_equal( + x1_select_shape, x2_select_shape, allow_none=True + ): + raise ValueError( + "Shape mismatch on `x1[axes[0]]` and `x2[axes[1]]`, " + f"received {x1_select_shape} and {x2_select_shape}." 
+ ) + + for ax in self.axes[0]: + x1_shape[ax] = -1 + for ax in self.axes[1]: + x2_shape[ax] = -1 + + x1_shape = list(filter((-1).__ne__, x1_shape)) + x2_shape = list(filter((-1).__ne__, x2_shape)) + + output_shape = x1_shape + x2_shape + return KerasTensor(output_shape, dtype=dtype) + + if self.axes <= 0: + output_shape = x1_shape + x2_shape + else: + output_shape = x1_shape[: -self.axes] + x2_shape[self.axes :] + + return KerasTensor(output_shape, dtype=dtype) + + +@keras_export(["keras.ops.tensordot", "keras.ops.numpy.tensordot"]) +def tensordot(x1, x2, axes=2): + """Compute the tensor dot product along specified axes. + + Args: + x1: First tensor. + x2: Second tensor. + axes: - If an integer, N, sum over the last N axes of `x1` and the + first N axes of `x2` in order. The sizes of the corresponding + axes must match. + - Or, a list of axes to be summed over, first sequence applying + to `x1`, second to `x2`. Both sequences must be of the + same length. + + Returns: + The tensor dot product of the inputs. 
+ """ + if any_symbolic_tensors((x1, x2)): + return Tensordot(axes=axes).symbolic_call(x1, x2) + return backend.numpy.tensordot(x1, x2, axes=axes) + + +class Tile(Operation): + def __init__(self, repeats): + super().__init__() + self.repeats = repeats + + def call(self, x): + return backend.numpy.tile(x, self.repeats) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + repeats = self.repeats + if isinstance(repeats, int): + repeats = [repeats] + if len(x_shape) > len(repeats): + repeats = [1] * (len(x_shape) - len(repeats)) + repeats + else: + x_shape = [1] * (len(repeats) - len(x_shape)) + x_shape + + output_shape = [] + for x_size, repeat in zip(x_shape, repeats): + if x_size is None: + output_shape.append(None) + else: + output_shape.append(x_size * repeat) + return KerasTensor(output_shape, dtype=x.dtype) + + +@keras_export(["keras.ops.tile", "keras.ops.numpy.tile"]) +def tile(x, repeats): + """Repeat `x` the number of times given by `repeats`. + + If `repeats` has length `d`, the result will have dimension of + `max(d, x.ndim)`. + + If `x.ndim < d`, `x` is promoted to be d-dimensional by prepending + new axes. + + If `x.ndim > d`, `repeats` is promoted to `x.ndim` by prepending 1's to it. + + Args: + x: Input tensor. + repeats: The number of repetitions of `x` along each axis. + + Returns: + The tiled output tensor. 
+ """ + if any_symbolic_tensors((x,)): + return Tile( + repeats, + ).symbolic_call(x) + return backend.numpy.tile(x, repeats) + + +class Trace(Operation): + def __init__(self, offset=0, axis1=0, axis2=1): + super().__init__() + self.offset = offset + self.axis1 = axis1 + self.axis2 = axis2 + + def call(self, x): + return backend.numpy.trace( + x, offset=self.offset, axis1=self.axis1, axis2=self.axis2 + ) + + def compute_output_spec(self, x): + x_shape = list(x.shape) + x_shape[self.axis1] = -1 + x_shape[self.axis2] = -1 + output_shape = list(filter((-1).__ne__, x_shape)) + output_dtype = backend.standardize_dtype(x.dtype) + if output_dtype not in ("int64", "uint32", "uint64"): + output_dtype = dtypes.result_type(output_dtype, "int32") + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.trace", "keras.ops.numpy.trace"]) +def trace(x, offset=0, axis1=0, axis2=1): + """Return the sum along diagonals of the tensor. + + If `x` is 2-D, the sum along its diagonal with the given offset is + returned, i.e., the sum of elements `x[i, i+offset]` for all `i`. + + If a has more than two dimensions, then the axes specified by `axis1` + and `axis2` are used to determine the 2-D sub-arrays whose traces are + returned. + + The shape of the resulting tensor is the same as that of `x` with `axis1` + and `axis2` removed. + + Args: + x: Input tensor. + offset: Offset of the diagonal from the main diagonal. Can be + both positive and negative. Defaults to `0`. + axis1: Axis to be used as the first axis of the 2-D sub-arrays. + Defaults to `0`.(first axis). + axis2: Axis to be used as the second axis of the 2-D sub-arrays. + Defaults to `1` (second axis). + + Returns: + If `x` is 2-D, the sum of the diagonal is returned. If `x` has + larger dimensions, then a tensor of sums along diagonals is + returned. 
+ """ + if any_symbolic_tensors((x,)): + return Trace(offset, axis1, axis2).symbolic_call(x) + return backend.numpy.trace(x, offset=offset, axis1=axis1, axis2=axis2) + + +class Tri(Operation): + def __init__(self, k=0, dtype=None): + super().__init__() + self.k = k + self.dtype = dtype or backend.floatx() + + def call(self, N, M=None): + return backend.numpy.tri(N=N, M=M, k=self.k, dtype=self.dtype) + + def compute_output_spec(self, N, M=None): + if M is None: + M = N + return KerasTensor((N, M), dtype=self.dtype) + + +@keras_export(["keras.ops.tri", "keras.ops.numpy.tri"]) +def tri(N, M=None, k=0, dtype=None): + """Return a tensor with ones at and below a diagonal and zeros elsewhere. + + Args: + N: Number of rows in the tensor. + M: Number of columns in the tensor. + k: The sub-diagonal at and below which the array is filled. + `k = 0` is the main diagonal, while `k < 0` is below it, and + `k > 0` is above. The default is 0. + dtype: Data type of the returned tensor. The default is "float32". + + Returns: + Tensor with its lower triangle filled with ones and zeros elsewhere. + `T[i, j] == 1` for `j <= i + k`, 0 otherwise. + """ + return backend.numpy.tri(N, M=M, k=k, dtype=dtype) + + +class Tril(Operation): + def __init__(self, k=0): + super().__init__() + self.k = k + + def call(self, x): + return backend.numpy.tril(x, k=self.k) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.tril", "keras.ops.numpy.tril"]) +def tril(x, k=0): + """Return lower triangle of a tensor. + + For tensors with `ndim` exceeding 2, `tril` will apply to the + final two axes. + + Args: + x: Input tensor. + k: Diagonal above which to zero elements. Defaults to `0`. the + main diagonal. `k < 0` is below it, and `k > 0` is above it. + + Returns: + Lower triangle of `x`, of same shape and data type as `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Tril(k=k).symbolic_call(x) + return backend.numpy.tril(x, k=k) + + +class Triu(Operation): + def __init__(self, k=0): + super().__init__() + self.k = k + + def call(self, x): + return backend.numpy.triu(x, k=self.k) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.triu", "keras.ops.numpy.triu"]) +def triu(x, k=0): + """Return upper triangle of a tensor. + + For tensors with `ndim` exceeding 2, `triu` will apply to the + final two axes. + + Args: + x: Input tensor. + k: Diagonal below which to zero elements. Defaults to `0`. the + main diagonal. `k < 0` is below it, and `k > 0` is above it. + + Returns: + Upper triangle of `x`, of same shape and data type as `x`. + """ + if any_symbolic_tensors((x,)): + return Triu(k=k).symbolic_call(x) + return backend.numpy.triu(x, k=k) + + +class Trunc(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.numpy.trunc(x) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype=x.dtype) + + +@keras_export(["keras.ops.trunc", "keras.ops.numpy.trunc"]) +def trunc(x): + """Return the truncated value of the input, element-wise. + + The truncated value of the scalar `x` is the nearest integer `i` which is + closer to zero than `x` is. In short, the fractional part of the signed + number `x` is discarded. + + Args: + x: Input tensor. + + Returns: + The truncated value of each element in `x`. 
+ + Example: + >>> x = ops.array([-1.7, -1.5, -0.2, 0.2, 1.5, 1.7, 2.0]) + >>> ops.trunc(x) + array([-1.0, -1.0, -0.0, 0.0, 1.0, 1.0, 2.0]) + """ + if any_symbolic_tensors((x,)): + return Trunc().symbolic_call(x) + return backend.numpy.trunc(x) + + +class Vdot(Operation): + def call(self, x1, x2): + return backend.numpy.vdot(x1, x2) + + def compute_output_spec(self, x1, x2): + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + return KerasTensor([], dtype=dtype) + + +@keras_export(["keras.ops.vdot", "keras.ops.numpy.vdot"]) +def vdot(x1, x2): + """Return the dot product of two vectors. + + If the first argument is complex, the complex conjugate of the first + argument is used for the calculation of the dot product. + + Multidimensional tensors are flattened before the dot product is taken. + + Args: + x1: First input tensor. If complex, its complex conjugate is taken + before calculation of the dot product. + x2: Second input tensor. + + Returns: + Output tensor. + """ + if any_symbolic_tensors((x1, x2)): + return Vdot().symbolic_call(x1, x2) + return backend.numpy.vdot(x1, x2) + + +class Inner(Operation): + def call(self, x1, x2): + return backend.numpy.inner(x1, x2) + + def compute_output_spec(self, x1, x2): + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + return KerasTensor([], dtype=dtype) + + +@keras_export(["keras.ops.inner", "keras.ops.numpy.inner"]) +def inner(x1, x2): + """Return the inner product of two tensors. + + Ordinary inner product of vectors for 1-D tensors + (without complex conjugation), in higher dimensions + a sum product over the last axes. + + Multidimensional arrays are treated as vectors by flattening + all but their last axes. The resulting dot product is performed + over their last axes. + + Args: + x1: First input tensor. + x2: Second input tensor. The last dimension of `x1` and `x2` + must match. + + Returns: + Output tensor. 
The shape of the output is determined by + broadcasting the shapes of `x1` and `x2` after removing + their last axes. + """ + if any_symbolic_tensors((x1, x2)): + return Inner().symbolic_call(x1, x2) + return backend.numpy.inner(x1, x2) + + +@keras_export(["keras.ops.vectorize", "keras.ops.numpy.vectorize"]) +def vectorize(pyfunc, *, excluded=None, signature=None): + """Turn a function into a vectorized function. + + Example: + + ```python + def myfunc(a, b): + return a + b + + vfunc = keras.ops.vectorize(myfunc) + y = vfunc([1, 2, 3, 4], 2) # Returns Tensor([3, 4, 5, 6]) + ``` + + Args: + pyfunc: Callable of a single tensor argument. + excluded: Optional set of integers representing + positional arguments for which the function + will not be vectorized. + These will be passed directly to `pyfunc` unmodified. + signature: Optional generalized universal function signature, + e.g., `"(m,n),(n)->(m)"` for vectorized + matrix-vector multiplication. If provided, + `pyfunc` will be called with (and expected to return) + arrays with shapes given by the size of corresponding + core dimensions. By default, `pyfunc` is assumed + to take scalars tensors as input and output. + + Returns: + A new function that applies `pyfunc` to every element + of its input along axis 0 (the batch axis). + """ + if not callable(pyfunc): + raise ValueError( + "Expected argument `pyfunc` to be a callable. " + f"Received: pyfunc={pyfunc}" + ) + return backend.numpy.vectorize( + pyfunc, excluded=excluded, signature=signature + ) + + +class Vstack(Operation): + def call(self, xs): + return backend.numpy.vstack(xs) + + def compute_output_spec(self, xs): + first_shape = xs[0].shape + total_size_on_axis = 0 + dtypes_to_resolve = [] + for x in xs: + if not shape_equal(x.shape, first_shape, axis=[0], allow_none=True): + raise ValueError( + "Every value in `xs` must have the same shape except on " + f"the `axis` dim. 
But found element of shape {x.shape}, " + f"which is different from the first element's " + f"shape {first_shape}." + ) + if total_size_on_axis is None or x.shape[0] is None: + total_size_on_axis = None + else: + total_size_on_axis += x.shape[0] + dtypes_to_resolve.append(getattr(x, "dtype", type(x))) + output_shape = list(first_shape) + output_shape[0] = total_size_on_axis + output_dtype = dtypes.result_type(*dtypes_to_resolve) + return KerasTensor(output_shape, output_dtype) + + +@keras_export(["keras.ops.vstack", "keras.ops.numpy.vstack"]) +def vstack(xs): + """Stack tensors in sequence vertically (row wise). + + Args: + xs: Sequence of tensors. + + Returns: + Tensor formed by stacking the given tensors. + """ + if any_symbolic_tensors((xs,)): + return Vstack().symbolic_call(xs) + return backend.numpy.vstack(xs) + + +class Where(Operation): + def call(self, condition, x1=None, x2=None): + return backend.numpy.where(condition, x1, x2) + + def compute_output_spec(self, condition, x1, x2): + condition_shape = getattr(condition, "shape", []) + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(condition_shape, x1_shape) + output_shape = broadcast_shapes(output_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1) if x1 is not None else "int"), + getattr(x2, "dtype", type(x2) if x2 is not None else "int"), + ) + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.where", "keras.ops.numpy.where"]) +def where(condition, x1=None, x2=None): + """Return elements chosen from `x1` or `x2` depending on `condition`. + + Args: + condition: Where `True`, yield `x1`, otherwise yield `x2`. + x1: Values from which to choose when `condition` is `True`. + x2: Values from which to choose when `condition` is `False`. + + Returns: + A tensor with elements from `x1` where `condition` is `True`, and + elements from `x2` where `condition` is `False`. 
+ """ + if (x1 is None and x2 is not None) or (x1 is not None and x2 is None): + raise ValueError( + "`x1` and `x2` either both should be `None`" + " or both should have non-None value." + ) + if any_symbolic_tensors((condition, x1, x2)): + return Where().symbolic_call(condition, x1, x2) + return backend.numpy.where(condition, x1, x2) + + +class Subtract(Operation): + def call(self, x1, x2): + return backend.numpy.subtract(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and x2_sparse + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + return KerasTensor(output_shape, dtype=dtype, sparse=output_sparse) + + +@keras_export(["keras.ops.subtract", "keras.ops.numpy.subtract"]) +def subtract(x1, x2): + """Subtract arguments element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise difference of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Subtract().symbolic_call(x1, x2) + return backend.numpy.subtract(x1, x2) + + +class Multiply(Operation): + def call(self, x1, x2): + return backend.numpy.multiply(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + x1_sparse = getattr(x1, "sparse", True) + x2_sparse = getattr(x2, "sparse", True) + output_sparse = x1_sparse or x2_sparse + dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + return KerasTensor(output_shape, dtype=dtype, sparse=output_sparse) + + +@keras_export(["keras.ops.multiply", "keras.ops.numpy.multiply"]) +def multiply(x1, x2): + """Multiply arguments element-wise. 
+ + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, element-wise product of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Multiply().symbolic_call(x1, x2) + return backend.numpy.multiply(x1, x2) + + +class Divide(Operation): + def call(self, x1, x2): + return backend.numpy.divide(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + float, + ) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and not x2_sparse + return KerasTensor( + output_shape, dtype=output_dtype, sparse=output_sparse + ) + + +@keras_export(["keras.ops.divide", "keras.ops.numpy.divide"]) +def divide(x1, x2): + """Divide arguments element-wise. + + `keras.ops.true_divide` is an alias for this function. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output tensor, the quotient `x1/x2`, element-wise. 
+ """ + if any_symbolic_tensors((x1, x2)): + return Divide().symbolic_call(x1, x2) + return backend.numpy.divide(x1, x2) + + +class DivideNoNan(Operation): + def call(self, x1, x2): + return backend.numpy.divide_no_nan(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + float, + ) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and not x2_sparse + return KerasTensor( + output_shape, dtype=output_dtype, sparse=output_sparse + ) + + +@keras_export(["keras.ops.divide_no_nan", "keras.ops.numpy.divide_no_nan"]) +def divide_no_nan(x1, x2): + """Safe element-wise division which returns 0 where the denominator is 0. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + The quotient `x1/x2`, element-wise, with zero where x2 is zero. 
+ """ + if any_symbolic_tensors((x1, x2)): + return DivideNoNan().symbolic_call(x1, x2) + return backend.numpy.divide_no_nan(x1, x2) + + +class TrueDivide(Operation): + def call(self, x1, x2): + return backend.numpy.true_divide(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + float, + ) + x1_sparse = getattr(x1, "sparse", False) + x2_sparse = getattr(x2, "sparse", False) + output_sparse = x1_sparse and not x2_sparse + return KerasTensor( + output_shape, dtype=output_dtype, sparse=output_sparse + ) + + +@keras_export( + [ + "keras.ops.true_divide", + "keras.ops.numpy.true_divide", + ] +) +def true_divide(x1, x2): + """Alias for `keras.ops.divide`.""" + if any_symbolic_tensors((x1, x2)): + return TrueDivide().symbolic_call(x1, x2) + return backend.numpy.true_divide(x1, x2) + + +class Power(Operation): + def call(self, x1, x2): + return backend.numpy.power(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), getattr(x2, "dtype", type(x2)) + ) + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.power", "keras.ops.numpy.power"]) +def power(x1, x2): + """First tensor elements raised to powers from second tensor, element-wise. + + Args: + x1: The bases. + x2: The exponents. + + Returns: + Output tensor, the bases in `x1` raised to the exponents in `x2`. 
+ """ + if any_symbolic_tensors((x1, x2)): + return Power().symbolic_call(x1, x2) + return backend.numpy.power(x1, x2) + + +class Negative(Operation): + def call(self, x): + return backend.numpy.negative(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.negative", "keras.ops.numpy.negative"]) +def negative(x): + """Numerical negative, element-wise. + + Args: + x: Input tensor. + + Returns: + Output tensor, `y = -x`. + """ + if any_symbolic_tensors((x,)): + return Negative().symbolic_call(x) + return backend.numpy.negative(x) + + +class Square(Operation): + def call(self, x): + return backend.numpy.square(x) + + def compute_output_spec(self, x): + sparse = getattr(x, "sparse", False) + dtype = backend.standardize_dtype(x.dtype) + if dtype == "bool": + dtype = "int32" + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.square", "keras.ops.numpy.square"]) +def square(x): + """Return the element-wise square of the input. + + Args: + x: Input tensor. + + Returns: + Output tensor, the square of `x`. + """ + if any_symbolic_tensors((x,)): + return Square().symbolic_call(x) + return backend.numpy.square(x) + + +class Sqrt(Operation): + def call(self, x): + x = backend.convert_to_tensor(x) + return backend.numpy.sqrt(x) + + def compute_output_spec(self, x): + dtype = ( + backend.floatx() + if backend.standardize_dtype(x.dtype) == "int64" + else dtypes.result_type(x.dtype, float) + ) + sparse = getattr(x, "sparse", False) + return KerasTensor(x.shape, dtype=dtype, sparse=sparse) + + +@keras_export(["keras.ops.sqrt", "keras.ops.numpy.sqrt"]) +def sqrt(x): + """Return the non-negative square root of a tensor, element-wise. + + Args: + x: Input tensor. + + Returns: + Output tensor, the non-negative square root of `x`. 
+ """ + if any_symbolic_tensors((x,)): + return Sqrt().symbolic_call(x) + x = backend.convert_to_tensor(x) + return backend.numpy.sqrt(x) + + +class Squeeze(Operation): + def __init__(self, axis=None): + super().__init__() + self.axis = axis + + def call(self, x): + return backend.numpy.squeeze(x, axis=self.axis) + + def compute_output_spec(self, x): + input_shape = list(x.shape) + sparse = getattr(x, "sparse", False) + axis = to_tuple_or_list(self.axis) + if axis is None: + output_shape = list(filter((1).__ne__, input_shape)) + return KerasTensor(output_shape, dtype=x.dtype, sparse=sparse) + else: + for a in axis: + if input_shape[a] != 1: + raise ValueError( + f"Cannot squeeze axis {a}, because the dimension " + "is not 1." + ) + axis = [canonicalize_axis(a, len(input_shape)) for a in axis] + for a in sorted(axis, reverse=True): + del input_shape[a] + return KerasTensor(input_shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.squeeze", "keras.ops.numpy.squeeze"]) +def squeeze(x, axis=None): + """Remove axes of length one from `x`. + + Args: + x: Input tensor. + axis: Select a subset of the entries of length one in the shape. + + Returns: + The input tensor with all or a subset of the dimensions of + length 1 removed. + """ + if any_symbolic_tensors((x,)): + return Squeeze(axis=axis).symbolic_call(x) + return backend.numpy.squeeze(x, axis=axis) + + +class Transpose(Operation): + def __init__(self, axes=None): + super().__init__() + self.axes = axes + + def call(self, x): + return backend.numpy.transpose(x, axes=self.axes) + + def compute_output_spec(self, x): + output_shape = operation_utils.compute_transpose_output_shape( + x.shape, self.axes + ) + sparse = getattr(x, "sparse", False) + return KerasTensor(output_shape, dtype=x.dtype, sparse=sparse) + + +@keras_export(["keras.ops.transpose", "keras.ops.numpy.transpose"]) +def transpose(x, axes=None): + """Returns a tensor with `axes` transposed. + + Args: + x: Input tensor. 
+ axes: Sequence of integers. Permutation of the dimensions of `x`. + By default, the order of the axes are reversed. + + Returns: + `x` with its axes permuted. + """ + if any_symbolic_tensors((x,)): + return Transpose(axes=axes).symbolic_call(x) + return backend.numpy.transpose(x, axes=axes) + + +class Mean(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.mean(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + ori_dtype = backend.standardize_dtype(x.dtype) + compute_dtype = dtypes.result_type(x.dtype, "float32") + if "int" in ori_dtype or ori_dtype == "bool": + result_dtype = compute_dtype + else: + result_dtype = ori_dtype + sparse = getattr(x, "sparse", False) + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=result_dtype, + sparse=sparse, + ) + + +@keras_export(["keras.ops.mean", "keras.ops.numpy.mean"]) +def mean(x, axis=None, keepdims=False): + """Compute the arithmetic mean along the specified axes. + + Args: + x: Input tensor. + axis: Axis or axes along which the means are computed. The default + is to compute the mean of the flattened tensor. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. + + Returns: + Output tensor containing the mean values. 
+ """ + if any_symbolic_tensors((x,)): + return Mean(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.mean(x, axis=axis, keepdims=keepdims) + + +class Var(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.var(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + output_dtype = backend.result_type(getattr(x, "dtype", type(x)), float) + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=output_dtype, + ) + + +@keras_export(["keras.ops.var", "keras.ops.numpy.var"]) +def var(x, axis=None, keepdims=False): + """Compute the variance along the specified axes. + + Args: + x: Input tensor. + axis: Axis or axes along which the variance is computed. The default + is to compute the variance of the flattened tensor. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. + + Returns: + Output tensor containing the variance. 
+ """ + if any_symbolic_tensors((x,)): + return Var(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.var(x, axis=axis, keepdims=keepdims) + + +class Sum(Operation): + def __init__(self, axis=None, keepdims=False): + super().__init__() + if isinstance(axis, int): + axis = [axis] + self.axis = axis + self.keepdims = keepdims + + def call(self, x): + return backend.numpy.sum(x, axis=self.axis, keepdims=self.keepdims) + + def compute_output_spec(self, x): + dtype = dtypes.result_type(getattr(x, "dtype", backend.floatx())) + # follow jax's rule + if dtype in ("bool", "int8", "int16"): + dtype = "int32" + elif dtype in ("uint8", "uint16"): + dtype = "uint32" + # TODO: torch doesn't support uint32 + if backend.backend() == "torch" and dtype == "uint32": + dtype = "int32" + sparse = getattr(x, "sparse", False) + return KerasTensor( + reduce_shape(x.shape, axis=self.axis, keepdims=self.keepdims), + dtype=dtype, + sparse=sparse, + ) + + +@keras_export(["keras.ops.sum", "keras.ops.numpy.sum"]) +def sum(x, axis=None, keepdims=False): + """Sum of a tensor over the given axes. + + Args: + x: Input tensor. + axis: Axis or axes along which the sum is computed. The default is to + compute the sum of the flattened tensor. + keepdims: If this is set to `True`, the axes which are reduced are left + in the result as dimensions with size one. + + Returns: + Output tensor containing the sum. + """ + if any_symbolic_tensors((x,)): + return Sum(axis=axis, keepdims=keepdims).symbolic_call(x) + return backend.numpy.sum(x, axis=axis, keepdims=keepdims) + + +class Zeros(Operation): + def call(self, shape, dtype=None): + return backend.numpy.zeros(shape, dtype=dtype) + + def compute_output_spec(self, shape, dtype=None): + dtype = dtype or backend.floatx() + return KerasTensor(shape, dtype=dtype) + + +@keras_export(["keras.ops.zeros", "keras.ops.numpy.zeros"]) +def zeros(shape, dtype=None): + """Return a new tensor of given shape and type, filled with zeros. 
+ + Args: + shape: Shape of the new tensor. + dtype: Desired data type of the tensor. + + Returns: + Tensor of zeros with the given shape and dtype. + """ + return backend.numpy.zeros(shape, dtype=dtype) + + +class Ones(Operation): + def call(self, shape, dtype=None): + return backend.numpy.ones(shape, dtype=dtype) + + def compute_output_spec(self, shape, dtype=None): + dtype = dtype or backend.floatx() + return KerasTensor(shape, dtype=dtype) + + +@keras_export(["keras.ops.ones", "keras.ops.numpy.ones"]) +def ones(shape, dtype=None): + """Return a new tensor of given shape and type, filled with ones. + + Args: + shape: Shape of the new tensor. + dtype: Desired data type of the tensor. + + Returns: + Tensor of ones with the given shape and dtype. + """ + return backend.numpy.ones(shape, dtype=dtype) + + +class Eye(Operation): + def __init__(self, k=0, dtype=None): + super().__init__() + self.k = k + self.dtype = dtype or backend.floatx() + + def call(self, N, M=None): + return backend.numpy.eye(N, M=M, k=self.k, dtype=self.dtype) + + def compute_output_spec(self, N, M=None): + if M is None: + M = N + return KerasTensor((N, M), dtype=self.dtype) + + +@keras_export(["keras.ops.eye", "keras.ops.numpy.eye"]) +def eye(N, M=None, k=0, dtype=None): + """Return a 2-D tensor with ones on the diagonal and zeros elsewhere. + + Args: + N: Number of rows in the output. + M: Number of columns in the output. If `None`, defaults to `N`. + k: Index of the diagonal: 0 (the default) refers to the main + diagonal, a positive value refers to an upper diagonal, + and a negative value to a lower diagonal. + dtype: Data type of the returned tensor. + + Returns: + Tensor with ones on the k-th diagonal and zeros elsewhere. 
+ """ + return backend.numpy.eye(N, M=M, k=k, dtype=dtype) + + +class FloorDivide(Operation): + def call(self, x1, x2): + return backend.numpy.floor_divide(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.floor_divide", "keras.ops.numpy.floor_divide"]) +def floor_divide(x1, x2): + """Returns the largest integer smaller or equal to the division of inputs. + + Args: + x1: Numerator. + x2: Denominator. + + Returns: + Output tensor, `y = floor(x1/x2)` + """ + if any_symbolic_tensors((x1, x2)): + return FloorDivide().symbolic_call(x1, x2) + return backend.numpy.floor_divide(x1, x2) + + +class LogicalXor(Operation): + def call(self, x1, x2): + return backend.numpy.logical_xor(x1, x2) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + output_shape = broadcast_shapes(x1_shape, x2_shape) + return KerasTensor(output_shape, dtype="bool") + + +@keras_export(["keras.ops.logical_xor", "keras.ops.numpy.logical_xor"]) +def logical_xor(x1, x2): + """Compute the truth value of `x1 XOR x2`, element-wise. + + Args: + x1: First input tensor. + x2: Second input tensor. + + Returns: + Output boolean tensor. 
+ """ + if any_symbolic_tensors((x1, x2)): + return LogicalXor().symbolic_call(x1, x2) + return backend.numpy.logical_xor(x1, x2) + + +class Correlate(Operation): + def __init__(self, mode="valid"): + super().__init__() + self.mode = mode + + def call(self, x1, x2): + return backend.numpy.correlate(x1, x2, mode=self.mode) + + def compute_output_spec(self, x1, x2): + x1_shape = getattr(x1, "shape", []) + x2_shape = getattr(x2, "shape", []) + if len(x1_shape) != 1: + raise ValueError( + "`x1` must be a 1-dimensional tensor, but received" + + f"shape {x1_shape}" + ) + if len(x2_shape) != 1: + raise ValueError( + "`x2` must be a 1-dimensional tensor, but received" + + f"shape {x2_shape}" + ) + x1_len, x2_len = x1_shape[0], x2_shape[0] + output_shape = ( + np.maximum(x1_len, x2_len) - np.minimum(x1_len, x2_len) + 1, + ) + if self.mode == "same": + output_shape = (np.maximum(x1_len, x2_len),) + elif self.mode == "full": + output_shape = (x1_len + x2_len - 1,) + if self.mode not in ("valid", "same", "full"): + raise ValueError( + "`mode` must be either `valid`, `same`, or `full`, but" + f"received: {self.mode}" + ) + output_dtype = dtypes.result_type( + getattr(x1, "dtype", type(x1)), + getattr(x2, "dtype", type(x2)), + ) + if output_dtype == "int64": + output_dtype = "float64" + elif output_dtype not in ["bfloat16", "float16", "float64"]: + output_dtype = "float32" + return KerasTensor(output_shape, dtype=output_dtype) + + +@keras_export(["keras.ops.correlate", "keras.ops.numpy.correlate"]) +def correlate(x1, x2, mode="valid"): + """Compute the cross-correlation of two 1-dimensional tensors. + + Args: + x1: First 1-dimensional input tensor of length M. + x2: Second 1-dimensional input tensor of length N. + mode: Either `valid`, `same` or `full`. + By default the mode is set to `valid`, which returns + an output of length max(M, N) - min(M, N) + 1. + `same` returns an output of length max(M, N). 
+ `full` mode returns the convolution at each point of + overlap, with an output length of N+M-1 + + Returns: + Output tensor, cross-correlation of `x1` and `x2`. + """ + if any_symbolic_tensors((x1, x2)): + return Correlate(mode=mode).symbolic_call(x1, x2) + return backend.numpy.correlate(x1, x2, mode=mode) + + +class Select(Operation): + def __init__(self): + super().__init__() + + def call(self, condlist, choicelist, default=0): + return backend.numpy.select(condlist, choicelist, default) + + def compute_output_spec(self, condlist, choicelist, default=0): + first_element = choicelist[0] + return KerasTensor(first_element.shape, dtype=first_element.dtype) + + +@keras_export(["keras.ops.select", "keras.ops.numpy.select"]) +def select(condlist, choicelist, default=0): + """Return elements from `choicelist`, based on conditions in `condlist`. + + Args: + condlist: List of boolean tensors. + The list of conditions which determine from which array + in choicelist the output elements are taken. + When multiple conditions are satisfied, + the first one encountered in condlist is used. + choicelist: List of tensors. + The list of tensors from which the output elements are taken. + This list has to be of the same length as `condlist`. + defaults: Optional scalar value. + The element inserted in the output + when all conditions evaluate to `False`. + + Returns: + Tensor where the output at position `m` is the `m`-th element + of the tensor in `choicelist` where the `m`-th element of the + corresponding tensor in `condlist` is `True`. + + Example: + + ```python + from keras import ops + + x = ops.arange(6) + condlist = [x<3, x>3] + choicelist = [x, x**2] + ops.select(condlist, choicelist, 42) + # Returns: tensor([0, 1, 2, 42, 16, 25]) + ``` + """ + if not isinstance(condlist, (list, tuple)) or not isinstance( + choicelist, (list, tuple) + ): + raise ValueError( + "condlist and choicelist must be lists. 
Received: " + f"type(condlist) = {type(condlist)}, " + f"type(choicelist) = {type(choicelist)}" + ) + condlist = list(condlist) + choicelist = list(choicelist) + if not condlist or not choicelist: + raise ValueError( + "condlist and choicelist must not be empty. Received: " + f"condlist = {condlist}, " + f"choicelist = {choicelist}" + ) + if any_symbolic_tensors(condlist + choicelist + [default]): + return Select().symbolic_call(condlist, choicelist, default) + return backend.numpy.select(condlist, choicelist, default) + + +class Slogdet(Operation): + def __init__(self): + super().__init__() + + def call(self, x): + return backend.numpy.slogdet(x) + + def compute_output_spec(self, x): + sign = KerasTensor((), dtype=x.dtype) + logabsdet = KerasTensor(x.shape[:-2], dtype=x.dtype) + return (sign, logabsdet) + + +@keras_export(["keras.ops.slogdet", "keras.ops.numpy.slogdet"]) +def slogdet(x): + """Compute the sign and natural logarithm of the determinant of a matrix. + + Args: + x: Input matrix. It must 2D and square. + + Returns: + A tuple `(sign, logabsdet)`. `sign` is a number representing + the sign of the determinant. For a real matrix, this is 1, 0, or -1. + For a complex matrix, this is a complex number with absolute value 1 + (i.e., it is on the unit circle), or else 0. + `logabsdet` is the natural log of the absolute value of the determinant. + """ + if any_symbolic_tensors((x,)): + return Slogdet().symbolic_call(x) + return backend.numpy.slogdet(x) + + +class Argpartition(Operation): + def __init__(self, kth, axis=-1): + super().__init__() + if not isinstance(kth, int): + raise ValueError("kth must be an integer. 
Received:" f"kth = {kth}") + self.kth = kth + self.axis = axis + + def call(self, x): + return backend.numpy.argpartition(x, kth=self.kth, axis=self.axis) + + def compute_output_spec(self, x): + return KerasTensor(x.shape, dtype="int32") + + +@keras_export(["keras.ops.argpartition", "keras.ops.numpy.argpartition"]) +def argpartition(x, kth, axis=-1): + """Performs an indirect partition along the given axis. + + It returns an array + of indices of the same shape as `x` that index data along the given axis + in partitioned order. + + Args: + a: Array to sort. + kth: Element index to partition by. + The k-th element will be in its final sorted position and all + smaller elements will be moved before it and all larger elements + behind it. The order of all elements in the partitions is undefined. + If provided with a sequence of k-th it will partition all of them + into their sorted position at once. + axis: Axis along which to sort. The default is -1 (the last axis). + If `None`, the flattened array is used. + + Returns: + Array of indices that partition `x` along the specified `axis`. 
+ """ + if any_symbolic_tensors((x,)): + return Argpartition(kth, axis).symbolic_call(x) + return backend.numpy.argpartition(x, kth, axis) + + +class Histogram(Operation): + def __init__(self, bins=10, range=None): + super().__init__() + + if not isinstance(bins, int): + raise TypeError("bins must be of type `int`") + if bins < 0: + raise ValueError("`bins` should be a non-negative integer") + + if range: + if len(range) < 2 or not isinstance(range, tuple): + raise ValueError("range must be a tuple of two elements") + + if range[1] < range[0]: + raise ValueError( + "The second element of range must be greater than the first" + ) + + self.bins = bins + self.range = range + + def call(self, x): + x = backend.convert_to_tensor(x) + if len(x.shape) > 1: + raise ValueError("Input tensor must be 1-dimensional") + return backend.math.histogram(x, bins=self.bins, range=self.range) + + def compute_output_spec(self, x): + return ( + KerasTensor(shape=(self.bins,), dtype=x.dtype), + KerasTensor(shape=(self.bins + 1,), dtype=x.dtype), + ) + + +@keras_export(["keras.ops.histogram", "keras.ops.numpy.histogram"]) +def histogram(x, bins=10, range=None): + """Computes a histogram of the data tensor `x`. + + Args: + x: Input tensor. + bins: An integer representing the number of histogram bins. + Defaults to 10. + range: A tuple representing the lower and upper range of the bins. + If not specified, it will use the min and max of `x`. + + Returns: + A tuple containing: + - A tensor representing the counts of elements in each bin. + - A tensor representing the bin edges. + + Example: + + ``` + >>> input_tensor = np.random.rand(8) + >>> keras.ops.histogram(input_tensor) + (array([1, 1, 1, 0, 0, 1, 2, 1, 0, 1], dtype=int32), + array([0.0189519 , 0.10294958, 0.18694726, 0.27094494, 0.35494262, + 0.43894029, 0.52293797, 0.60693565, 0.69093333, 0.77493101, + 0.85892869])) + ``` + """ + if not isinstance(bins, int): + raise TypeError( + f"Argument `bins` must be of type `int`. 
Received: bins={bins}" + ) + if bins < 0: + raise ValueError( + "Argument `bins` should be a non-negative integer. " + f"Received: bins={bins}" + ) + + if range: + if len(range) < 2 or not isinstance(range, tuple): + raise ValueError( + "Argument `range` must be a tuple of two elements. " + f"Received: range={range}" + ) + + if range[1] < range[0]: + raise ValueError( + "The second element of `range` must be greater than the first. " + f"Received: range={range}" + ) + + if any_symbolic_tensors((x,)): + return Histogram(bins=bins, range=range).symbolic_call(x) + + x = backend.convert_to_tensor(x) + if len(x.shape) > 1: + raise ValueError( + "Input tensor must be 1-dimensional. " + f"Received: input.shape={x.shape}" + ) + return backend.numpy.histogram(x, bins=bins, range=range) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/operation.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/operation.py new file mode 100644 index 0000000000000000000000000000000000000000..a289bc5f321362824688a92b1a371479852fc259 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/operation.py @@ -0,0 +1,316 @@ +import inspect +import textwrap + +from keras.src import backend +from keras.src import dtype_policies +from keras.src import tree +from keras.src.api_export import keras_export +from keras.src.backend.common.keras_tensor import any_symbolic_tensors +from keras.src.ops.node import Node +from keras.src.utils import python_utils +from keras.src.utils import traceback_utils +from keras.src.utils.naming import auto_name + + +@keras_export("keras.Operation") +class Operation: + def __init__(self, dtype=None, name=None): + if name is None: + name = auto_name(self.__class__.__name__) + if not isinstance(name, str) or "/" in name: + raise ValueError( + "Argument `name` must be a string and " + "cannot contain character `/`. 
" + f"Received: name={name} (of type {type(name)})" + ) + self._dtype_policy = dtype_policies.get(dtype) + self.name = name + self._inbound_nodes = [] + self._outbound_nodes = [] + + @traceback_utils.filter_traceback + def __call__(self, *args, **kwargs): + if traceback_utils.is_traceback_filtering_enabled(): + # Wrap self.call to provide helpful info in case of exception + if any_symbolic_tensors(args, kwargs): + call_fn = self.symbolic_call + else: + if getattr(self, "quantization_mode", None) is not None: + call_fn = self.quantized_call + else: + call_fn = self.call + call_fn = traceback_utils.inject_argument_info_in_traceback( + call_fn, + object_name=(f"{self.__class__.__name__}.call()"), + ) + return call_fn(*args, **kwargs) + + # Plain flow. + if any_symbolic_tensors(args, kwargs): + return self.symbolic_call(*args, **kwargs) + if getattr(self, "quantization_mode", None) is not None: + return self.quantized_call(*args, **kwargs) + else: + return self.call(*args, **kwargs) + + def symbolic_call(self, *args, **kwargs): + # Perform shape/dtype inference. + outputs = self.compute_output_spec(*args, **kwargs) + # Record a new node in the operations graph. + # The Node wires itself to inbound and outbound ops. The + # Node constructor updates this op's self._inbound_nodes, + # sets _keras_history on the outputs, and adds itself to the + # `_outbound_nodes` of the ops that produced the inputs to this + # call. + Node( + operation=self, call_args=args, call_kwargs=kwargs, outputs=outputs + ) + return outputs + + def call(self, *args, **kwargs): + raise NotImplementedError + + def quantized_call(self, *args, **kwargs): + raise NotImplementedError + + def compute_output_spec(self, *args, **kwargs): + try: + return backend.compute_output_spec(self.call, *args, **kwargs) + except Exception as e: + new_e = e.__class__( + "Could not automatically infer the output shape / dtype of " + f"'{self.name}' (of type {self.__class__.__name__}). 
" + f"Either the `{self.__class__.__name__}.call()` method " + f"is incorrect, or you need to implement the " + f"`{self.__class__.__name__}.compute_output_spec() / " + "compute_output_shape()` method. " + f"Error encountered:\n\n{e}" + ) + raise new_e.with_traceback(e.__traceback__) from None + + def __new__(cls, *args, **kwargs): + """We override __new__ to saving serializable constructor arguments. + + These arguments are used to auto-generate an object serialization + config, which enables user-created subclasses to be serializable + out of the box in most cases without forcing the user + to manually implement `get_config()`. + """ + instance = super(Operation, cls).__new__(cls) + + # Generate a config to be returned by default by `get_config()`. + arg_names = inspect.getfullargspec(cls.__init__).args + kwargs.update(dict(zip(arg_names[1 : len(args) + 1], args))) + + # Explicitly serialize `dtype` to support auto_config + dtype = kwargs.get("dtype", None) + if dtype is not None and isinstance(dtype, dtype_policies.DTypePolicy): + # For backward compatibility, we use a str (`name`) for + # `DTypePolicy` + if dtype.quantization_mode is None: + kwargs["dtype"] = dtype.name + # Otherwise, use `dtype_policies.serialize` + else: + kwargs["dtype"] = dtype_policies.serialize(dtype) + + # For safety, we only rely on auto-configs for a small set of + # serializable types. 
+ supported_types = (str, int, float, bool, type(None)) + try: + flat_arg_values = tree.flatten(kwargs) + auto_config = True + for value in flat_arg_values: + if not isinstance(value, supported_types): + auto_config = False + break + except TypeError: + auto_config = False + try: + instance._lock = False + if auto_config: + from keras.src.saving import serialization_lib + + instance._auto_config = serialization_lib.SerializableDict( + **kwargs + ) + else: + instance._auto_config = None + instance._lock = True + except RecursionError: + # Setting an instance attribute in __new__ has the potential + # to trigger an infinite recursion if a subclass overrides + # setattr in an unsafe way. + pass + return instance + + @python_utils.default + def get_config(self): + """Returns the config of the object. + + An object config is a Python dictionary (serializable) + containing the information needed to re-instantiate it. + """ + config = { + "name": self.name, + } + + if not python_utils.is_default(self.get_config): + # In this case the subclass implements get_config() + return config + + # In this case the subclass doesn't implement get_config(): + # Let's see if we can autogenerate it. + if getattr(self, "_auto_config", None) is not None: + xtra_args = set(config.keys()) + config.update(self._auto_config.config) + # Remove args non explicitly supported + argspec = inspect.getfullargspec(self.__init__) + if argspec.varkw != "kwargs": + for key in xtra_args - xtra_args.intersection(argspec.args[1:]): + config.pop(key, None) + return config + else: + raise NotImplementedError( + textwrap.dedent( + f""" + Object {self.__class__.__name__} was created by passing + non-serializable argument values in `__init__()`, + and therefore the object must override `get_config()` in + order to be serializable. Please implement `get_config()`. 
+ + Example: + + class CustomLayer(keras.layers.Layer): + def __init__(self, arg1, arg2, **kwargs): + super().__init__(**kwargs) + self.arg1 = arg1 + self.arg2 = arg2 + + def get_config(self): + config = super().get_config() + config.update({{ + "arg1": self.arg1, + "arg2": self.arg2, + }}) + return config""" + ) + ) + + @classmethod + def from_config(cls, config): + """Creates an operation from its config. + + This method is the reverse of `get_config`, capable of instantiating the + same operation from the config dictionary. + + Note: If you override this method, you might receive a serialized dtype + config, which is a `dict`. You can deserialize it as follows: + + ```python + if "dtype" in config and isinstance(config["dtype"], dict): + policy = dtype_policies.deserialize(config["dtype"]) + ``` + + Args: + config: A Python dictionary, typically the output of `get_config`. + + Returns: + An operation instance. + """ + # Explicitly deserialize dtype config if needed. This enables users to + # directly interact with the instance of `DTypePolicy`. + if "dtype" in config and isinstance(config["dtype"], dict): + config = config.copy() + policy = dtype_policies.deserialize(config["dtype"]) + if ( + not isinstance(policy, dtype_policies.DTypePolicyMap) + and policy.quantization_mode is None + ): + # For backward compatibility, we use a str (`name`) for + # `DTypePolicy` + policy = policy.name + config["dtype"] = policy + try: + return cls(**config) + except Exception as e: + raise TypeError( + f"Error when deserializing class '{cls.__name__}' using " + f"config={config}.\n\nException encountered: {e}" + ) + + def __repr__(self): + return f"" + + @property + def input(self): + """Retrieves the input tensor(s) of a symbolic operation. + + Only returns the tensor(s) corresponding to the *first time* + the operation was called. + + Returns: + Input tensor or list of input tensors. 
+ """ + return self._get_node_attribute_at_index(0, "input_tensors", "input") + + @property + def output(self): + """Retrieves the output tensor(s) of a layer. + + Only returns the tensor(s) corresponding to the *first time* + the operation was called. + + Returns: + Output tensor or list of output tensors. + """ + return self._get_node_attribute_at_index(0, "output_tensors", "output") + + def _get_node_attribute_at_index(self, node_index, attr, attr_name): + """Private utility to retrieves an attribute (e.g. inputs) from a node. + + This is used to implement the properties: + - output + - input + + Args: + node_index: Integer index of the node from which + to retrieve the attribute. + attr: Exact node attribute name. + attr_name: Human-readable attribute name, for error messages. + + Returns: + The operation's attribute `attr` at the node of index `node_index`. + """ + if not self._inbound_nodes: + raise AttributeError( + f"The layer {self.name} has never been called " + f"and thus has no defined {attr_name}." + ) + if not len(self._inbound_nodes) > node_index: + raise ValueError( + f"Asked to get {attr_name} at node " + f"{node_index}, but the operation has only " + f"{len(self._inbound_nodes)} inbound nodes." 
+ ) + values = getattr(self._inbound_nodes[node_index], attr) + if isinstance(values, list) and len(values) == 1: + return values[0] + else: + return values + + # Hooks for backend layer classes + def _post_build(self): + """Can be overridden for per backend post build actions.""" + pass + + def _setattr_hook(self, name, value): + """Can be overridden for per backend post build actions.""" + return name, value + + def _post_track_variable(self, variable): + """Can be overridden for per backend post track actions.""" + pass + + def _post_untrack_variable(self, variable): + """Can be overridden for per backend post untrack actions.""" + pass diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/operation_utils.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/operation_utils.py new file mode 100644 index 0000000000000000000000000000000000000000..f5ca1857c039bcd535bed2e83c742bd6abcc3c4b --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/operation_utils.py @@ -0,0 +1,421 @@ +import math + +import numpy as np + +from keras.src import tree +from keras.src.api_export import keras_export +from keras.src.backend.common.backend_utils import canonicalize_axis +from keras.src.backend.common.backend_utils import to_tuple_or_list + + +def broadcast_shapes(shape1, shape2): + """Broadcast input shapes to a unified shape. + + Convert to list for mutability. + + Args: + shape1: A tuple or list of integers. + shape2: A tuple or list of integers. + + Returns: + output_shape (list of integers or `None`): The broadcasted shape. 
+ + Example: + >>> broadcast_shapes((5, 3), (1, 3)) + [5, 3] + """ + shape1 = list(shape1) + shape2 = list(shape2) + origin_shape1 = shape1 + origin_shape2 = shape2 + + if len(shape1) > len(shape2): + shape2 = [1] * (len(shape1) - len(shape2)) + shape2 + if len(shape1) < len(shape2): + shape1 = [1] * (len(shape2) - len(shape1)) + shape1 + output_shape = list(shape1) + for i in range(len(shape1)): + if shape1[i] == 1: + output_shape[i] = shape2[i] + elif shape1[i] is None: + output_shape[i] = None if shape2[i] == 1 else shape2[i] + else: + if shape2[i] == 1 or shape2[i] is None or shape2[i] == shape1[i]: + output_shape[i] = shape1[i] + else: + raise ValueError( + "Cannot broadcast shape, the failure dim has value " + f"{shape1[i]}, which cannot be broadcasted to {shape2[i]}. " + f"Input shapes are: {origin_shape1} and {origin_shape2}." + ) + + return output_shape + + +def compute_expand_dims_output_shape(input_shape, axis): + """Compute the output shape for the `expand_dims` operation. + + Args: + input_shape: Input shape. + axis: int or sequence of ints for the axis to expand. + + Returns: + Tuple of ints: The output shape after the `expand_dims` operation. + """ + input_shape = list(input_shape) + if axis is None: + axis = len(input_shape) + axis = to_tuple_or_list(axis) + out_ndim = len(axis) + len(input_shape) + axis = [canonicalize_axis(a, out_ndim) for a in axis] + shape_iter = iter(input_shape) + new_shape = [ + 1 if ax in axis else next(shape_iter) for ax in range(out_ndim) + ] + return tuple(new_shape) + + +def compute_pooling_output_shape( + input_shape, + pool_size, + strides, + padding="valid", + data_format="channels_last", +): + """Computes the output shape of pooling operations. + + Args: + input_shape: Input shape. Must be a tuple of integers. + pool_size: Size of the pooling operation. Must be a tuple of integers. + strides: Stride of the pooling operation. Must be a tuple of integers. + Defaults to `pool_size`. + padding: Padding method. 
Available methods are `"valid"` or `"same"`. + Defaults to `"valid"`. + data_format: String, either `"channels_last"` or `"channels_first"`. + The ordering of the dimensions in the inputs. `"channels_last"` + corresponds to inputs with shape `(batch, height, width, channels)` + while `"channels_first"` corresponds to inputs with shape + `(batch, channels, height, weight)`. Defaults to `"channels_last"`. + + Returns: + Tuple of ints: The output shape of the pooling operation. + + Examples: + + # Basic usage with square pooling on a single image + >>> compute_pooling_output_shape((1, 4, 4, 1), (2, 2)) + (1, 2, 2, 1) + + # Strided pooling on a single image with strides different from pool_size + >>> compute_pooling_output_shape((1, 4, 4, 1), (2, 2), strides=(1, 1)) + (1, 3, 3, 1) + + # Pooling on a batch of images + >>> compute_pooling_output_shape((32, 4, 4, 3), (2, 2)) + (32, 2, 2, 3) + """ + strides = pool_size if strides is None else strides + input_shape_origin = list(input_shape) + input_shape = np.array(input_shape) + if data_format == "channels_last": + spatial_shape = input_shape[1:-1] + else: + spatial_shape = input_shape[2:] + none_dims = [] + for i in range(len(spatial_shape)): + if spatial_shape[i] is None: + # Set `None` shape to a manual value so that we can run numpy + # computation on `spatial_shape`. + spatial_shape[i] = -1 + none_dims.append(i) + pool_size = np.array(pool_size) + if padding == "valid": + output_spatial_shape = ( + np.floor((spatial_shape - pool_size) / strides) + 1 + ) + for i in range(len(output_spatial_shape)): + if i not in none_dims and output_spatial_shape[i] < 0: + raise ValueError( + "Computed output size would be negative. Received: " + f"`inputs.shape={input_shape}` and `pool_size={pool_size}`." + ) + elif padding == "same": + output_spatial_shape = np.floor((spatial_shape - 1) / strides) + 1 + else: + raise ValueError( + "Argument `padding` must be either 'valid' or 'same'. 
Received: " + f"padding={padding}" + ) + output_spatial_shape = [int(i) for i in output_spatial_shape] + for i in none_dims: + output_spatial_shape[i] = None + output_spatial_shape = tuple(output_spatial_shape) + if data_format == "channels_last": + output_shape = ( + (input_shape_origin[0],) + + output_spatial_shape + + (input_shape_origin[-1],) + ) + else: + output_shape = ( + input_shape_origin[0], + input_shape_origin[1], + ) + output_spatial_shape + return output_shape + + +def compute_conv_output_shape( + input_shape, + filters, + kernel_size, + strides=1, + padding="valid", + data_format="channels_last", + dilation_rate=1, +): + """Compute the output shape of conv ops.""" + if data_format == "channels_last": + spatial_shape = input_shape[1:-1] + kernel_shape = kernel_size + (input_shape[-1], filters) + else: + spatial_shape = input_shape[2:] + kernel_shape = kernel_size + (input_shape[1], filters) + if len(kernel_shape) != len(input_shape): + raise ValueError( + "Kernel shape must have the same length as input, but received " + f"kernel of shape {kernel_shape} and " + f"input of shape {input_shape}." + ) + if isinstance(dilation_rate, int): + dilation_rate = (dilation_rate,) * len(spatial_shape) + if isinstance(strides, int): + strides = (strides,) * len(spatial_shape) + if len(dilation_rate) != len(spatial_shape): + raise ValueError( + "Dilation must be None, scalar or tuple/list of length of " + "inputs' spatial shape, but received " + f"`dilation_rate={dilation_rate}` and " + f"input of shape {input_shape}." + ) + none_dims = [] + spatial_shape = np.array(spatial_shape) + for i in range(len(spatial_shape)): + if spatial_shape[i] is None: + # Set `None` shape to a manual value so that we can run numpy + # computation on `spatial_shape`. 
+ spatial_shape[i] = -1 + none_dims.append(i) + + kernel_spatial_shape = np.array(kernel_shape[:-2]) + dilation_rate = np.array(dilation_rate) + if padding == "valid": + output_spatial_shape = ( + np.floor( + (spatial_shape - dilation_rate * (kernel_spatial_shape - 1) - 1) + / strides + ) + + 1 + ) + for i in range(len(output_spatial_shape)): + if i not in none_dims and output_spatial_shape[i] < 0: + raise ValueError( + "Computed output size would be negative. Received " + f"`inputs shape={input_shape}`, " + f"`kernel shape={kernel_shape}`, " + f"`dilation_rate={dilation_rate}`." + ) + elif padding == "same" or padding == "causal": + output_spatial_shape = np.floor((spatial_shape - 1) / strides) + 1 + else: + raise ValueError( + "`padding` must be either `'valid'` or `'same'`. Received " + f"{padding}." + ) + output_spatial_shape = [int(i) for i in output_spatial_shape] + for i in none_dims: + output_spatial_shape[i] = None + output_spatial_shape = tuple(output_spatial_shape) + if data_format == "channels_last": + output_shape = ( + (input_shape[0],) + output_spatial_shape + (kernel_shape[-1],) + ) + else: + output_shape = (input_shape[0], kernel_shape[-1]) + output_spatial_shape + return output_shape + + +def compute_matmul_output_shape(shape1, shape2): + """Compute the output shape of a `matmul` operation. + + Args: + shape1: Shape of the left operand. + shape2: Shape of the right operand. + + Returns: + Tuple of ints: The output shape for the `matmul` operation. + """ + if len(shape1) == 1: + shape1 = (1, shape1[0]) + if len(shape2) == 1: + shape2 = (shape2[0], 1) + if ( + shape1[-1] is not None + and shape2[-2] is not None + and shape1[-1] != shape2[-2] + ): + raise ValueError( + "Inner dimensions (`x1.shape[-1]` and `x2.shape[-2]`) must be " + f"equal, but received `x1.shape={shape1}` and " + f"`x2.shape={shape2}`." 
+ ) + + leading_shape = broadcast_shapes(shape1[:-2], shape2[:-2]) + last_2_dims_shape = [shape1[-2], shape2[-1]] + output_shape = leading_shape + last_2_dims_shape + if len(shape1) == 1: + del output_shape[-2] + if len(shape2) == 1: + del output_shape[-1] + return tuple(output_shape) + + +def compute_reshape_output_shape(input_shape, newshape, newshape_arg_name): + """Converts `-1` in `newshape` to either an actual dimension or `None`. + + This utility does not special case the 0th dimension (batch size). + """ + unknown_dim_count = newshape.count(-1) + if unknown_dim_count > 1: + raise ValueError( + "There must be at most one unknown dimension (-1) in " + f"{newshape_arg_name}. Received: {newshape_arg_name}={newshape}." + ) + + # If there is a None in input_shape, we can't infer what the -1 is + if None in input_shape: + return tuple(dim if dim != -1 else None for dim in newshape) + + input_size = math.prod(input_shape) + # If the `newshape` is fully defined, return it + if unknown_dim_count == 0: + if input_size != math.prod(newshape): + raise ValueError( + "The total size of the tensor must be unchanged. Received: " + f"input_shape={input_shape}, {newshape_arg_name}={newshape}" + ) + return newshape + + # We have one -1 in `newshape`, compute the actual value + known_output_size = 1 + unknown_dim_index = None + for index, dim in enumerate(newshape): + if dim == -1: + unknown_dim_index = index + else: + known_output_size *= dim + + if known_output_size == 0 or input_size % known_output_size != 0: + raise ValueError( + "The total size of the tensor must be unchanged, however, the " + "input size cannot by divided by the specified dimensions in " + f"{newshape_arg_name}. 
Received: input_shape={input_shape}, " + f"{newshape_arg_name}={newshape}" + ) + + output_shape = list(newshape) + output_shape[unknown_dim_index] = input_size // known_output_size + return tuple(output_shape) + + +def compute_transpose_output_shape(input_shape, axes): + """Compute the output shape for the `transpose` operation. + + Args: + input_shape: Input shape. + axes: Permutation of the dimensions for the `transpose` operation. + + Returns: + Tuple of ints: The output shape after the `transpose` operation. + """ + input_shape = list(input_shape) + if axes is None: + return tuple(input_shape[::-1]) + + if len(axes) != len(input_shape): + raise ValueError( + "axis must be a list of the same length as the input shape, " + f"expected {len(input_shape)}, but received {len(axes)}." + ) + return tuple(input_shape[ax] for ax in axes) + + +def compute_take_along_axis_output_shape(input_shape, indices_shape, axis): + input_shape = list(input_shape) + indices_shape = list(indices_shape) + if axis is None: + input_shape = ( + [None] if None in input_shape else [int(np.prod(input_shape))] + ) + + if len(input_shape) != len(indices_shape): + raise ValueError( + "`x` and `indices` must have the same number of dimensions, " + f"but receive shape {input_shape} and {indices_shape}." + ) + + input_shape[axis] = indices_shape[axis] + output_shape = broadcast_shapes(input_shape, indices_shape) + return output_shape + + +def reduce_shape(shape, axis=None, keepdims=False): + shape = list(shape) + if axis is None: + if keepdims: + return tuple([1 for _ in shape]) + else: + return tuple([]) + + if keepdims: + for ax in axis: + shape[ax] = 1 + return tuple(shape) + else: + for ax in sorted(axis, reverse=True): + del shape[ax] + return tuple(shape) + + +@keras_export("keras.utils.get_source_inputs") +def get_source_inputs(tensor): + """Returns the list of input tensors necessary to compute `tensor`. + + Output will always be a list of tensors + (potentially with 1 element). 
+ + Args: + tensor: The tensor to start from. + + Returns: + List of input tensors. + """ + if not hasattr(tensor, "_keras_history"): + return tensor + + operation, node_index, _ = tensor._keras_history + if not operation or not operation._inbound_nodes: + return [tensor] + else: + node = operation._inbound_nodes[node_index] + if node.is_input: + # Reached input node, stop recursion. + return tree.flatten(node.output_tensors) + else: + source_tensors = [] + for tensor in node.input_tensors: + previous_sources = get_source_inputs(tensor) + # Avoid input redundancy. + for x in previous_sources: + if all(x is not t for t in source_tensors): + source_tensors.append(x) + return source_tensors diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/symbolic_arguments.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/symbolic_arguments.py new file mode 100644 index 0000000000000000000000000000000000000000..c71e04e7b1456ffea89e3a473a6cd62d09f07030 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/ops/symbolic_arguments.py @@ -0,0 +1,46 @@ +from keras.src import tree +from keras.src.backend import KerasTensor + + +class SymbolicArguments: + def __init__(self, *args, **kwargs): + self.args = tree.map_structure(lambda x: x, args) + self.kwargs = tree.map_structure(lambda x: x, kwargs) + self._flat_arguments = tree.flatten((self.args, self.kwargs)) + + # Used to avoid expensive `tree` operations in the most common case. 
+ if ( + not self.kwargs + and len(self.args) == 1 + and isinstance(self.args[0], KerasTensor) + ): + self._single_positional_tensor = self.args[0] + else: + self._single_positional_tensor = None + + self.keras_tensors = [] + for arg in self._flat_arguments: + if isinstance(arg, KerasTensor): + self.keras_tensors.append(arg) + + def convert(self, conversion_fn): + args = tree.map_structure(conversion_fn, self.args) + kwargs = tree.map_structure(conversion_fn, self.kwargs) + return args, kwargs + + def fill_in(self, tensor_dict): + """Maps KerasTensors to computed values using `tensor_dict`. + + `tensor_dict` maps `KerasTensor` instances to their current values. + """ + if self._single_positional_tensor is not None: + # Performance optimization for most common case. + # Approx. 70x faster. + return (tensor_dict[id(self._single_positional_tensor)],), {} + + def switch_fn(x): + if isinstance(x, KerasTensor): + return tensor_dict.get(id(x), None) + return x + + return self.convert(switch_fn) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__init__.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..d00c96d989543f5c262795d6db21432585739887 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__init__.py @@ -0,0 +1,121 @@ +from keras.src.api_export import keras_export +from keras.src.optimizers.adadelta import Adadelta +from keras.src.optimizers.adafactor import Adafactor +from keras.src.optimizers.adagrad import Adagrad +from keras.src.optimizers.adam import Adam +from keras.src.optimizers.adamax import Adamax +from keras.src.optimizers.adamw import AdamW +from keras.src.optimizers.ftrl import Ftrl +from keras.src.optimizers.lion import Lion +from keras.src.optimizers.loss_scale_optimizer import LossScaleOptimizer +from keras.src.optimizers.nadam import Nadam +from 
keras.src.optimizers.optimizer import Optimizer +from keras.src.optimizers.rmsprop import RMSprop +from keras.src.optimizers.sgd import SGD +from keras.src.saving import serialization_lib + +ALL_OBJECTS = { + Optimizer, + Adam, + SGD, + RMSprop, + Adadelta, + AdamW, + Adagrad, + Adamax, + Adafactor, + Nadam, + Ftrl, + Lion, + LossScaleOptimizer, +} +ALL_OBJECTS_DICT = {cls.__name__.lower(): cls for cls in ALL_OBJECTS} + + +@keras_export("keras.optimizers.serialize") +def serialize(optimizer): + """Returns the optimizer configuration as a Python dict. + + Args: + optimizer: An `Optimizer` instance to serialize. + + Returns: + Python dict which contains the configuration of the optimizer. + """ + return serialization_lib.serialize_keras_object(optimizer) + + +@keras_export("keras.optimizers.deserialize") +def deserialize(config, custom_objects=None): + """Returns a Keras optimizer object via its configuration. + + Args: + config: Optimizer configuration dictionary. + custom_objects: Optional dictionary mapping names (strings) to custom + objects (classes and functions) to be considered during + deserialization. + + Returns: + A Keras Optimizer instance. + """ + # Make deserialization case-insensitive for built-in optimizers. + if config["class_name"].lower() in ALL_OBJECTS_DICT: + config["class_name"] = config["class_name"].lower() + + return serialization_lib.deserialize_keras_object( + config, + module_objects=ALL_OBJECTS_DICT, + custom_objects=custom_objects, + ) + + +@keras_export("keras.optimizers.get") +def get(identifier): + """Retrieves a Keras Optimizer instance. + + Args: + identifier: Optimizer identifier, one of: + - String: name of an optimizer + - Dictionary: configuration dictionary. + - Keras Optimizer instance (it will be returned unchanged). + + Returns: + A Keras Optimizer instance. 
+ """ + if identifier is None: + return None + elif isinstance(identifier, dict): + obj = deserialize(identifier) + elif isinstance(identifier, str): + config = {"class_name": identifier, "config": {}} + obj = deserialize(config) + else: + obj = identifier + + if isinstance(obj, Optimizer): + return obj + raise ValueError(f"Could not interpret optimizer identifier: {identifier}") + + +# We will add this temporarily so that tensorflow packages that depend on +# estimators will continue to import (there are a large number). Note that +# Keras 3 will not work with the estimators API. +@keras_export( + [ + "keras.optimizers.legacy.Adagrad", + "keras.optimizers.legacy.Adam", + "keras.optimizers.legacy.Ftrl", + "keras.optimizers.legacy.RMSprop", + "keras.optimizers.legacy.SGD", + "keras.optimizers.legacy.Optimizer", + ] +) +class LegacyOptimizerWarning: + def __init__(self, *args, **kwargs): + raise ImportError( + "`keras.optimizers.legacy` is not supported in Keras 3. When using " + "`tf.keras`, to continue using a `tf.keras.optimizers.legacy` " + "optimizer, you can install the `tf_keras` package (Keras 2) and " + "set the environment variable `TF_USE_LEGACY_KERAS=True` to " + "configure TensorFlow to use `tf_keras` when accessing `tf.keras`." 
+ ) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/__init__.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..8be4db0bf8314a19ec6bbdc9d6af330274f15063 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/__init__.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adadelta.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adadelta.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..7662b5185d9134958677e8b90a2218f727292451 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adadelta.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adafactor.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adafactor.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..933338e60f28976f36389a001044bd7a7c34e87c Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adafactor.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adagrad.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adagrad.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..bf6cd16963f9cdb37af4434ff0a2bbd6bfd4920e Binary files /dev/null and 
b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adagrad.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adam.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adam.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2b73869feeb40075c6f5c652d1287680bca294d2 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adam.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adamax.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adamax.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..9f5f5ca42fe8cb236d88eb0261cb1035be4558cf Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adamax.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adamw.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adamw.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..001e538da84a6f8b3e8c05723c1f32087c4d8fe3 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/adamw.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/base_optimizer.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/base_optimizer.cpython-310.pyc new file mode 100644 index 
0000000000000000000000000000000000000000..6b13f92606a50558833b7c268b72b911d28710b5 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/base_optimizer.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/ftrl.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/ftrl.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..927a62f289f59243eccd65f44b3c4a8dc0e24e71 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/ftrl.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/lamb.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/lamb.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..dff7ec4334d87bb8af21a7996a4770299614265b Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/lamb.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/lion.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/lion.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..f7d454a7da019cf6bceed3e53c90019848f81826 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/lion.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/loss_scale_optimizer.cpython-310.pyc 
b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/loss_scale_optimizer.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a701228b7c14fa438a167437cc35158c6cd21fd6 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/loss_scale_optimizer.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/nadam.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/nadam.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..3f141123a41a2dc1e2618b3c42b3050b25b907dd Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/nadam.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/optimizer.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/optimizer.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..295ba9ce10eef26ab52a903c85649594fb53539b Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/optimizer.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/rmsprop.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/rmsprop.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..d635bd2e15f6a65caedd13f262e8d38e33773750 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/rmsprop.cpython-310.pyc differ diff --git 
a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/sgd.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/sgd.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ff68b34eaf35b26a4c72463e3cf7665b2451e35b Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/__pycache__/sgd.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adadelta.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adadelta.py new file mode 100644 index 0000000000000000000000000000000000000000..4ec7d936c2427334e76a6403d408779b4c7faa80 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adadelta.py @@ -0,0 +1,139 @@ +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export(["keras.optimizers.Adadelta"]) +class Adadelta(optimizer.Optimizer): + """Optimizer that implements the Adadelta algorithm. + + Adadelta optimization is a stochastic gradient descent method that is based + on adaptive learning rate per dimension to address two drawbacks: + + - The continual decay of learning rates throughout training. + - The need for a manually selected global learning rate. + + Adadelta is a more robust extension of Adagrad that adapts learning rates + based on a moving window of gradient updates, instead of accumulating all + past gradients. This way, Adadelta continues learning even when many updates + have been done. Compared to Adagrad, in the original version of Adadelta you + don't have to set an initial learning rate. In this version, the initial + learning rate can be set, as in most other Keras optimizers. 
+ + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. Note that `Adadelta` + tends to benefit from higher initial learning rate values compared + to other optimizers. To match the exact form in the original paper, + use 1.0. + rho: A floating point value. The decay rate. Defaults to `0.95`. + epsilon: Small floating point value for maintaining numerical stability. + {{base_optimizer_keyword_args}} + + Reference: + + - [Zeiler, 2012](http://arxiv.org/abs/1212.5701) + """ + + def __init__( + self, + learning_rate=0.001, + rho=0.95, + epsilon=1e-7, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="adadelta", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + name=name, + **kwargs, + ) + self.rho = rho + self.epsilon = epsilon + + def build(self, var_list): + if self.built: + return + super().build(var_list) + self._accumulated_grads = [] + self._accumulated_delta_vars = [] + for var in var_list: + self._accumulated_grads.append( + self.add_variable_from_reference(var, "accumulated_grad") + ) + self._accumulated_delta_vars.append( + self.add_variable_from_reference(var, "accumulated_delta_var") + ) + + def update_step(self, grad, variable, learning_rate): + """Update step given gradient and the associated model variable.""" + lr = ops.cast(learning_rate, variable.dtype) + grad = ops.cast(grad, variable.dtype) + + rho = 
self.rho + accumulated_grad = self._accumulated_grads[ + self._get_variable_index(variable) + ] + accumulated_delta_var = self._accumulated_delta_vars[ + self._get_variable_index(variable) + ] + + def rms(x): + return ops.sqrt(ops.add(x, self.epsilon)) + + self.assign( + accumulated_grad, + ops.add( + rho * accumulated_grad, ops.multiply(1 - rho, ops.square(grad)) + ), + ) + delta_var = ops.negative( + ops.divide( + ops.multiply(rms(accumulated_delta_var), grad), + rms(accumulated_grad), + ) + ) + self.assign( + accumulated_delta_var, + ops.add( + ops.multiply(rho, accumulated_delta_var), + ops.multiply(1 - rho, ops.square(delta_var)), + ), + ) + self.assign_add(variable, ops.multiply(lr, delta_var)) + + def get_config(self): + config = super().get_config() + + config.update( + { + "rho": self.rho, + "epsilon": self.epsilon, + } + ) + return config + + +Adadelta.__doc__ = Adadelta.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adafactor.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adafactor.py new file mode 100644 index 0000000000000000000000000000000000000000..bf94b6f37fb5b168385b4bb4493d5db19e2fbe72 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adafactor.py @@ -0,0 +1,208 @@ +from keras.src import backend +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export(["keras.optimizers.Adafactor"]) +class Adafactor(optimizer.Optimizer): + """Optimizer that implements the Adafactor algorithm. + + Adafactor is commonly used in NLP tasks, and has the advantage + of taking less memory because it only saves partial information of previous + gradients. + + The default argument setup is based on the original paper (see reference). 
+ When gradients are of dimension > 2, Adafactor optimizer will delete the + last 2 dimensions separately in its accumulator variables. + + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. + beta_2_decay: float, defaults to -0.8. The decay rate of `beta_2`. + epsilon_1: float, defaults to 1e-30. A small offset to keep denominator + away from 0. + epsilon_2: float, defaults to 1e-3. A small offset to avoid learning + rate becoming too small by time. + clip_threshold: float, defaults to 1.0. Clipping threshold. This is a + part of Adafactor algorithm, independent from `clipnorm`, + `clipvalue`, and `global_clipnorm`. + relative_step: bool, defaults to `True`. If `learning_rate` is a + constant and `relative_step=True`, learning rate will be adjusted + based on current iterations. This is a default learning rate decay + in Adafactor. + {{base_optimizer_keyword_args}} + + Reference: + + - [Shazeer, Noam et al., 2018](https://arxiv.org/abs/1804.04235). 
+ + """ + + def __init__( + self, + learning_rate=0.001, + beta_2_decay=-0.8, + epsilon_1=1e-30, + epsilon_2=1e-3, + clip_threshold=1.0, + relative_step=True, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="adafactor", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + name=name, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + **kwargs, + ) + self.beta_2_decay = beta_2_decay + self.epsilon_1 = epsilon_1 + self.epsilon_2 = epsilon_2 + self.clip_threshold = clip_threshold + self.relative_step = relative_step + + def build(self, var_list): + """Initialize optimizer variables. + + Adam optimizer has 3 types of variables: momentums, velocities and + velocity_hat (only set when amsgrad is applied), + + Args: + var_list: list of model variables to build Adam variables on. + """ + if self.built: + return + super().build(var_list) + self._r = [] + self._c = [] + self._v = [] + for var in var_list: + if len(var.shape) < 2: + # Don't factor if variable is of dimension < 2, but we still + # need to create dummy variables as placeholder. + with backend.name_scope(self.name, caller=self): + self._r.append( + backend.Variable(0, name=var.name, trainable=False) + ) + self._c.append( + backend.Variable(0, name=var.name, trainable=False) + ) + else: + # Always factor the last 2 dimensions. 
+ r_shape = var.shape[:-1] + c_shape = var.shape[:-2] + (var.shape[-1],) + self._r.append( + self.add_variable( + shape=r_shape, + dtype=var.dtype, + name=var.name, + ) + ) + self._c.append( + self.add_variable( + shape=c_shape, + dtype=var.dtype, + name=var.name, + ) + ) + self._v.append( + self.add_variable_from_reference( + reference_variable=var, name="velocity" + ) + ) + + def _rms(self, x): + return ops.sqrt(ops.mean(ops.square(x))) + + def update_step(self, gradient, variable, learning_rate): + """Update step given gradient and the associated model variable.""" + + lr = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + epsilon_2 = ops.cast(self.epsilon_2, variable.dtype) + one = ops.cast(1.0, variable.dtype) + local_step = ops.cast(self.iterations + 1, variable.dtype) + if not callable(self._learning_rate) and self.relative_step: + lr = ops.minimum(lr, 1 / ops.sqrt(local_step)) + + r = self._r[self._get_variable_index(variable)] + c = self._c[self._get_variable_index(variable)] + v = self._v[self._get_variable_index(variable)] + + rho_t = ops.minimum(lr, 1 / ops.sqrt(local_step)) + alpha_t = ops.maximum(epsilon_2, self._rms(variable)) * rho_t + regulated_grad_square = ops.add(ops.square(gradient), self.epsilon_1) + beta_2_t = 1 - ops.power(local_step, self.beta_2_decay) + + if len(variable.shape) >= 2: + # `r` deletes the last dimension of gradient, so it is of shape + # `gradient.shape[:-1]`. + self.assign( + r, + beta_2_t * r + + (1 - beta_2_t) * ops.mean(regulated_grad_square, axis=-1), + ) + # `c` deletes the second last dimension of gradient, so it is of + # shape `gradient.shape[:-2] + gradient.shape[-1]`. 
+ self.assign( + c, + beta_2_t * c + + (1 - beta_2_t) * ops.mean(regulated_grad_square, axis=-2), + ) + self.assign( + v, + ops.expand_dims( + r / ops.mean(r, axis=-1, keepdims=True), axis=-1 + ) + * ops.expand_dims(c, -2), + ) + else: + self.assign( + v, beta_2_t * v + (1 - beta_2_t) * regulated_grad_square + ) + + u_t = ops.divide(gradient, ops.sqrt(v)) + u_t_hat = ops.divide( + u_t, + ops.maximum(one, ops.divide(self._rms(u_t), self.clip_threshold)), + ) + self.assign_sub(variable, ops.multiply(alpha_t, u_t_hat)) + + def get_config(self): + config = super().get_config() + + config.update( + { + "beta_2_decay": self.beta_2_decay, + "epsilon_1": self.epsilon_1, + "epsilon_2": self.epsilon_2, + "clip_threshold": self.clip_threshold, + "relative_step": self.relative_step, + } + ) + return config + + +Adafactor.__doc__ = Adafactor.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adagrad.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adagrad.py new file mode 100644 index 0000000000000000000000000000000000000000..856a6c24e0b691ba721a6c93ce535e9eb253a428 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adagrad.py @@ -0,0 +1,115 @@ +from keras.src import initializers +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export(["keras.optimizers.Adagrad"]) +class Adagrad(optimizer.Optimizer): + """Optimizer that implements the Adagrad algorithm. + + Adagrad is an optimizer with parameter-specific learning rates, + which are adapted relative to how frequently a parameter gets + updated during training. The more updates a parameter receives, + the smaller the updates. 
+ + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. Note that `Adagrad` + tends to benefit from higher initial learning rate values compared + to other optimizers. To match the exact form in the original paper, + use `1.0`. + initial_accumulator_value: Floating point value. Starting value for the + accumulators (per-parameter momentum values). Must be non-negative. + epsilon: Small floating point value for maintaining numerical stability. + {{base_optimizer_keyword_args}} + + Reference: + + - [Duchi et al., 2011]( + http://www.jmlr.org/papers/volume12/duchi11a/duchi11a.pdf). + """ + + def __init__( + self, + learning_rate=0.001, + initial_accumulator_value=0.1, + epsilon=1e-7, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="adagrad", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + name=name, + **kwargs, + ) + self.initial_accumulator_value = initial_accumulator_value + self.epsilon = epsilon + + def build(self, var_list): + if self.built: + return + super().build(var_list) + self._accumulators = [] + initializer = initializers.Constant(self.initial_accumulator_value) + for var in var_list: + self._accumulators.append( + self.add_variable( + shape=var.shape, + initializer=initializer, + dtype=var.dtype, + name="accumulator", + ) + ) + + def update_step(self, gradient, variable, learning_rate): + """Update step 
given gradient and the associated model variable.""" + lr = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + + accumulator = self._accumulators[self._get_variable_index(variable)] + + self.assign_add(accumulator, ops.square(gradient)) + self.assign_sub( + variable, + ops.divide( + ops.multiply(lr, gradient), + ops.sqrt(ops.add(accumulator, self.epsilon)), + ), + ) + + def get_config(self): + config = super().get_config() + + config.update( + { + "initial_accumulator_value": self.initial_accumulator_value, + "epsilon": self.epsilon, + } + ) + return config + + +Adagrad.__doc__ = Adagrad.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adam.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adam.py new file mode 100644 index 0000000000000000000000000000000000000000..b7da957e74ce047ad3c4e12fcbd404bc6640db29 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adam.py @@ -0,0 +1,167 @@ +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export(["keras.optimizers.Adam"]) +class Adam(optimizer.Optimizer): + """Optimizer that implements the Adam algorithm. + + Adam optimization is a stochastic gradient descent method that is based on + adaptive estimation of first-order and second-order moments. + + According to + [Kingma et al., 2014](http://arxiv.org/abs/1412.6980), + the method is "*computationally + efficient, has little memory requirement, invariant to diagonal rescaling of + gradients, and is well suited for problems that are large in terms of + data/parameters*". 
+ + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. + beta_1: A float value or a constant float tensor, or a callable + that takes no arguments and returns the actual value to use. The + exponential decay rate for the 1st moment estimates. Defaults to + `0.9`. + beta_2: A float value or a constant float tensor, or a callable + that takes no arguments and returns the actual value to use. The + exponential decay rate for the 2nd moment estimates. Defaults to + `0.999`. + epsilon: A small constant for numerical stability. This epsilon is + "epsilon hat" in the Kingma and Ba paper (in the formula just before + Section 2.1), not the epsilon in Algorithm 1 of the paper. Defaults + to `1e-7`. + amsgrad: Boolean. Whether to apply AMSGrad variant of this algorithm + from the paper "On the Convergence of Adam and beyond". Defaults + to `False`. + {{base_optimizer_keyword_args}} + """ + + def __init__( + self, + learning_rate=0.001, + beta_1=0.9, + beta_2=0.999, + epsilon=1e-7, + amsgrad=False, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="adam", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + name=name, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + **kwargs, + ) + self.beta_1 = beta_1 + self.beta_2 = beta_2 + self.epsilon = epsilon + self.amsgrad = amsgrad + + def build(self, var_list): + """Initialize optimizer variables. 
+ + Adam optimizer has 3 types of variables: momentums, velocities and + velocity_hat (only set when amsgrad is applied), + + Args: + var_list: list of model variables to build Adam variables on. + """ + if self.built: + return + super().build(var_list) + self._momentums = [] + self._velocities = [] + for var in var_list: + self._momentums.append( + self.add_variable_from_reference( + reference_variable=var, name="momentum" + ) + ) + self._velocities.append( + self.add_variable_from_reference( + reference_variable=var, name="velocity" + ) + ) + if self.amsgrad: + self._velocity_hats = [] + for var in var_list: + self._velocity_hats.append( + self.add_variable_from_reference( + reference_variable=var, name="velocity_hat" + ) + ) + + def update_step(self, gradient, variable, learning_rate): + """Update step given gradient and the associated model variable.""" + lr = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + local_step = ops.cast(self.iterations + 1, variable.dtype) + beta_1_power = ops.power( + ops.cast(self.beta_1, variable.dtype), local_step + ) + beta_2_power = ops.power( + ops.cast(self.beta_2, variable.dtype), local_step + ) + + m = self._momentums[self._get_variable_index(variable)] + v = self._velocities[self._get_variable_index(variable)] + + alpha = lr * ops.sqrt(1 - beta_2_power) / (1 - beta_1_power) + + self.assign_add( + m, ops.multiply(ops.subtract(gradient, m), 1 - self.beta_1) + ) + self.assign_add( + v, + ops.multiply( + ops.subtract(ops.square(gradient), v), 1 - self.beta_2 + ), + ) + if self.amsgrad: + v_hat = self._velocity_hats[self._get_variable_index(variable)] + self.assign(v_hat, ops.maximum(v_hat, v)) + v = v_hat + self.assign_sub( + variable, + ops.divide( + ops.multiply(m, alpha), ops.add(ops.sqrt(v), self.epsilon) + ), + ) + + def get_config(self): + config = super().get_config() + config.update( + { + "beta_1": self.beta_1, + "beta_2": self.beta_2, + "epsilon": self.epsilon, + "amsgrad": 
self.amsgrad, + } + ) + return config + + +Adam.__doc__ = Adam.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adamax.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adamax.py new file mode 100644 index 0000000000000000000000000000000000000000..f1d816475c4cf27a68cd866f9bd0306220be3aef --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adamax.py @@ -0,0 +1,156 @@ +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export(["keras.optimizers.Adamax"]) +class Adamax(optimizer.Optimizer): + """Optimizer that implements the Adamax algorithm. + + Adamax, a variant of Adam based on the infinity norm, is a first-order + gradient-based optimization method. Due to its capability of adjusting the + learning rate based on data characteristics, it is suited to learn + time-variant process, e.g., speech data with dynamically changed noise + conditions. Default parameters follow those provided in the paper (see + references below). + + Initialization: + + ```python + m = 0 # Initialize initial 1st moment vector + u = 0 # Initialize the exponentially weighted infinity norm + t = 0 # Initialize timestep + ``` + + The update rule for parameter `w` with gradient `g` is described at the end + of section 7.1 of the paper (see the reference section): + + ```python + t += 1 + m = beta1 * m + (1 - beta) * g + u = max(beta2 * u, abs(g)) + current_lr = learning_rate / (1 - beta1 ** t) + w = w - current_lr * m / (u + epsilon) + ``` + + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. 
+ beta_1: A float value or a constant float tensor. The exponential decay + rate for the 1st moment estimates. + beta_2: A float value or a constant float tensor. The exponential decay + rate for the exponentially weighted infinity norm. + epsilon: A small constant for numerical stability. + {{base_optimizer_keyword_args}} + + Reference: + + - [Kingma et al., 2014](http://arxiv.org/abs/1412.6980) + """ + + def __init__( + self, + learning_rate=0.001, + beta_1=0.9, + beta_2=0.999, + epsilon=1e-7, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="adamax", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + name=name, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + **kwargs, + ) + self.beta_1 = beta_1 + self.beta_2 = beta_2 + self.epsilon = epsilon + + def build(self, var_list): + """Initialize optimizer variables. + + Adamax optimizer has 2 types of variables: momentums (denoted as m), + exponentially weighted infinity norm (denoted as u). + + Args: + var_list: list of model variables to build Adamax variables on. 
+ """ + if self.built: + return + super().build(var_list) + self._m = [] + self._u = [] + for var in var_list: + self._m.append( + self.add_variable_from_reference( + reference_variable=var, name="momentum" + ) + ) + self._u.append( + self.add_variable_from_reference( + reference_variable=var, name="norm" + ) + ) + + def update_step(self, gradient, variable, learning_rate): + """Update step given gradient and the associated model variable.""" + lr = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + local_step = ops.cast(self.iterations + 1, variable.dtype) + beta_1_power = ops.power( + ops.cast(self.beta_1, variable.dtype), local_step + ) + + m = self._m[self._get_variable_index(variable)] + u = self._u[self._get_variable_index(variable)] + + self.assign_add( + m, ops.multiply(ops.subtract(gradient, m), (1 - self.beta_1)) + ) + self.assign( + u, ops.maximum(ops.multiply(self.beta_2, u), ops.abs(gradient)) + ) + self.assign_sub( + variable, + ops.divide( + ops.multiply(lr, m), + ops.multiply((1 - beta_1_power), ops.add(u, self.epsilon)), + ), + ) + + def get_config(self): + config = super().get_config() + + config.update( + { + "beta_1": self.beta_1, + "beta_2": self.beta_2, + "epsilon": self.epsilon, + } + ) + return config + + +Adamax.__doc__ = Adamax.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adamw.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adamw.py new file mode 100644 index 0000000000000000000000000000000000000000..9db4a30094abc30928c8840dbe4f6bfe951803e4 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/adamw.py @@ -0,0 +1,100 @@ +from keras.src.api_export import keras_export +from keras.src.optimizers import adam +from keras.src.optimizers import optimizer + + 
+@keras_export(["keras.optimizers.AdamW"]) +class AdamW(adam.Adam): + """Optimizer that implements the AdamW algorithm. + + AdamW optimization is a stochastic gradient descent method that is based on + adaptive estimation of first-order and second-order moments with an added + method to decay weights per the techniques discussed in the paper, + 'Decoupled Weight Decay Regularization' by + [Loshchilov, Hutter et al., 2019](https://arxiv.org/abs/1711.05101). + + According to + [Kingma et al., 2014](http://arxiv.org/abs/1412.6980), + the underlying Adam method is "*computationally + efficient, has little memory requirement, invariant to diagonal rescaling of + gradients, and is well suited for problems that are large in terms of + data/parameters*". + + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. + beta_1: A float value or a constant float tensor, or a callable + that takes no arguments and returns the actual value to use. The + exponential decay rate for the 1st moment estimates. + Defaults to `0.9`. + beta_2: A float value or a constant float tensor, or a callable + that takes no arguments and returns the actual value to use. The + exponential decay rate for the 2nd moment estimates. + Defaults to `0.999`. + epsilon: A small constant for numerical stability. This epsilon is + "epsilon hat" in the Kingma and Ba paper (in the formula just + before Section 2.1), not the epsilon in Algorithm 1 of the paper. + Defaults to 1e-7. + amsgrad: Boolean. Whether to apply AMSGrad variant of this algorithm + from the paper "On the Convergence of Adam and beyond". + Defaults to `False`. 
+ {{base_optimizer_keyword_args}} + + References: + + - [Loshchilov et al., 2019](https://arxiv.org/abs/1711.05101) + - [Kingma et al., 2014](http://arxiv.org/abs/1412.6980) for `adam` + - [Reddi et al., 2018]( + https://openreview.net/pdf?id=ryQu7f-RZ) for `amsgrad`. + """ + + def __init__( + self, + learning_rate=0.001, + weight_decay=0.004, + beta_1=0.9, + beta_2=0.999, + epsilon=1e-7, + amsgrad=False, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="adamw", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + beta_1=beta_1, + beta_2=beta_2, + epsilon=epsilon, + amsgrad=amsgrad, + name=name, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + **kwargs, + ) + + if self.weight_decay is None: + raise ValueError( + "Argument `weight_decay` must be a float. 
Received: " + "weight_decay=None" + ) + + +AdamW.__doc__ = AdamW.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/base_optimizer.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/base_optimizer.py new file mode 100644 index 0000000000000000000000000000000000000000..57833afadc7e92d88b83dd2e5b04ca2816d74165 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/base_optimizer.py @@ -0,0 +1,1102 @@ +import re +import warnings + +from keras.src import backend +from keras.src import initializers +from keras.src import ops +from keras.src.optimizers.schedules import learning_rate_schedule +from keras.src.saving import serialization_lib +from keras.src.saving.keras_saveable import KerasSaveable +from keras.src.utils import tracking +from keras.src.utils.naming import auto_name + + +class BaseOptimizer(KerasSaveable): + """Abstract optimizer base class. + + If you intend to create your own optimization algorithm, please inherit from + this class and override the following methods: + + - `build`: Create your optimizer-related variables, such as momentum + variables in the SGD optimizer. + - `update_step`: Implement your optimizer's variable updating logic. + - `get_config`: serialization of the optimizer. 
+ + Example: + + ```python + class SGD(Optimizer): + def __init__(self, **kwargs): + super().__init__(**kwargs) + self.momentum = 0.9 + + def build(self, variables): + super().build(variables) + self.momentums = [] + for variable in variables: + self.momentums.append( + self.add_variable_from_reference( + reference_variable=variable, name="momentum" + ) + ) + + def update_step(self, gradient, variable, learning_rate): + learning_rate = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + m = self.momentums[self._get_variable_index(variable)] + self.assign( + m, + ops.subtract( + ops.multiply(m, ops.cast(self.momentum, variable.dtype)), + ops.multiply(gradient, learning_rate), + ), + ) + self.assign_add(variable, m) + + def get_config(self): + config = super().get_config() + config.update( + { + "momentum": self.momentum, + "nesterov": self.nesterov, + } + ) + return config + ``` + """ + + def __init__( + self, + learning_rate, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name=None, + **kwargs, + ): + self._lock = False + + if kwargs.pop("decay", None) is not None: + warnings.warn( + "Argument `decay` is no longer supported and will be ignored." + ) + if kwargs: + raise ValueError(f"Argument(s) not recognized: {kwargs}") + + if name is None: + name = auto_name(self.__class__.__name__) + self.name = name + self.weight_decay = weight_decay + self.clipnorm = clipnorm + self.global_clipnorm = global_clipnorm + self.clipvalue = clipvalue + self.use_ema = use_ema + self.loss_scale_factor = loss_scale_factor + self.gradient_accumulation_steps = gradient_accumulation_steps + + if gradient_accumulation_steps: + if not gradient_accumulation_steps >= 2: + raise ValueError( + "`gradient_accumulation_steps` must be an integer >= 2. 
" + "Received: gradient_accumulation_steps=" + f"{gradient_accumulation_steps}" + ) + + if use_ema: + # Verify the arguments related to EMA. + if ema_momentum > 1 or ema_momentum < 0: + raise ValueError( + "`ema_momentum` must be in the range [0, 1]. " + f"Received: ema_momentum={ema_momentum}" + ) + if ema_overwrite_frequency and ( + not isinstance(ema_overwrite_frequency, int) + or ema_overwrite_frequency < 1 + ): + raise ValueError( + "`ema_overwrite_frequency` must be an integer >= 1 or " + "None. Received: ema_overwrite_frequency=" + f"{ema_overwrite_frequency}" + ) + self.ema_momentum = ema_momentum + self.ema_overwrite_frequency = ema_overwrite_frequency + + clip_args_sum = sum( + a is not None for a in [clipnorm, clipvalue, global_clipnorm] + ) + if clip_args_sum > 1: + raise ValueError( + "Only one of `clipnorm`, `clipvalue` and `global_clipnorm` can " + f"be set. Received: clipnorm={clipnorm}, " + f"clipvalue={clipvalue}, global_clipnorm={global_clipnorm}" + ) + self.built = False + + # Set up variable tracking. + self._variables = [] + self._trainable_variables = [] + self._tracker = tracking.Tracker( + { + "variables": ( + lambda x: isinstance(x, backend.Variable), + self._variables, + ), + } + ) + self._trainable_variables_indices = {} + + # Create iteration variable + # Note: dtype="int" will resolve to int32 in JAX + # (since int64 is disallowed in JAX) and to int64 in TF. 
+ with backend.name_scope(self.name, caller=self): + iterations = backend.Variable( + 0, + name="iteration", + dtype="int", + trainable=False, + aggregation="only_first_replica", + ) + self._track_variable(iterations) + self._iterations = iterations + + # Create learning rate (schedule or variable) + if isinstance( + learning_rate, learning_rate_schedule.LearningRateSchedule + ): + self._learning_rate = learning_rate + elif callable(learning_rate): + self._learning_rate = learning_rate + else: + if not isinstance(learning_rate, float): + raise ValueError( + "Argument `learning_rate` should be float, or an instance " + "of LearningRateSchedule, or a callable " + "(that takes in the current iteration value " + "and returns the corresponding learning rate value). " + f"Received instead: learning_rate={learning_rate}" + ) + with backend.name_scope(self.name, caller=self): + learning_rate = backend.Variable( + learning_rate, + name="learning_rate", + dtype=backend.floatx(), + trainable=False, + aggregation="only_first_replica", + ) + self._track_variable(learning_rate) + self._learning_rate = learning_rate + + @property + def iterations(self): + if self.gradient_accumulation_steps: + return ops.floor_divide( + self._iterations, self.gradient_accumulation_steps + ) + + return self._iterations + + def _track_variable(self, variable): + self._tracker.add_to_store("variables", variable) + + @tracking.no_automatic_dependency_tracking + def build(self, variables): + if self.use_ema: + self._model_variables_moving_average = [] + if self.gradient_accumulation_steps: + self._accumulated_gradients = [] + for i, variable in enumerate(variables): + self._trainable_variables_indices[self._var_key(variable)] = i + if self.use_ema: + self._model_variables_moving_average.append( + self.add_variable_from_reference( + variable, + name="average", + ) + ) + if self.gradient_accumulation_steps: + self._accumulated_gradients.append( + self.add_variable_from_reference( + variable, + 
name="gradient_accumulator", + ) + ) + self._trainable_variables = variables[:] + self.built = True + + def _var_key(self, variable): + # Helper function to get a stable ID and the variable instance mapping. + return id(variable) + + @property + def variables(self): + return self._variables[:] + + def _get_variable_index(self, variable): + return self._trainable_variables_indices[self._var_key(variable)] + + def add_variable( + self, + shape, + initializer="zeros", + dtype=None, + aggregation="none", + name=None, + ): + """Add a variable to the optimizer. + + Args: + shape: Shape tuple for the variable. Must be fully-defined + (no `None` entries). + initializer: Initializer object to use to populate the initial + variable value, or string name of a built-in initializer + (e.g. `"random_normal"`). Defaults to `"zeros"`. + dtype: Dtype of the variable to create, e.g. `"float32"`. If + unspecified, defaults to the `keras.backend.floatx()`. + aggregation: Optional string, one of `None`, `"none"`, `"mean"`, + `"sum"` or `"only_first_replica"`. Annotates the variable with + the type of multi-replica aggregation to be used for this + variable when writing custom data parallel training loops. + Defaults to `"none"`. + name: String name of the variable. Useful for debugging purposes. + + Returns: + An optimizer variable, in the format of `keras.Variable`. + """ + self._check_super_called() + initializer = initializers.get(initializer) + with backend.name_scope(self.name, caller=self): + variable = backend.Variable( + initializer=initializer, + shape=shape, + dtype=dtype, + trainable=False, + aggregation=aggregation, + name=name, + ) + self._track_variable(variable) + return variable + + def add_variable_from_reference( + self, reference_variable, name=None, initializer="zeros" + ): + """Add an optimizer variable from the model variable. + + Create an optimizer variable based on the information of model variable. 
+ For example, in SGD optimizer momemtum, for each model variable, a + corresponding momemtum variable is created of the same shape and dtype. + + Args: + reference_variable: `keras.Variable`. The corresponding model + variable to the optimizer variable to be created. + name: Optional string. The name prefix of the optimizer variable to + be created. If not provided, it will be set to `"var"`. The + variable name will follow the pattern + `{variable_name}_{reference_variable.name}`, + e.g., `momemtum/dense_1`. Defaults to `None`. + initializer: Initializer object to use to populate the initial + variable value, or string name of a built-in initializer + (e.g. `"random_normal"`). If unspecified, defaults to + `"zeros"`. + + Returns: + An optimizer variable, in the format of `keras.Variable`. + """ + name = name or "var" + if hasattr(reference_variable, "path"): + name = reference_variable.path.replace("/", "_") + "_" + name + else: + name = ( + str(reference_variable.name).replace("/", "_").replace(":", "_") + + "_" + + name + ) + return self.add_variable( + shape=reference_variable.shape, + initializer=initializer, + dtype=reference_variable.dtype, + name=name, + ) + + def _check_variables_are_known(self, variables): + for v in variables: + if self._var_key(v) not in self._trainable_variables_indices: + raise ValueError( + f"Unknown variable: {v}. This optimizer can only " + "be called for the variables it was originally built with. " + "When working with a new set of variables, you should " + "recreate a new optimizer instance." + ) + + def assign(self, variable, value): + """Assign a value to a variable. + + This should be used in optimizers instead of `variable.assign(value)` to + support backend specific optimizations. + Note that the variable can be a model variable or an optimizer variable; + it can be a backend native variable or a Keras variable. + + Args: + variable: The variable to update. + value: The value to add to the variable. 
+ """ + variable.assign(value) + + def assign_add(self, variable, value): + """Add a value to a variable. + + This should be used in optimizers instead of + `variable.assign_add(value)` to support backend specific optimizations. + Note that the variable can be a model variable or an optimizer variable; + it can be a backend native variable or a Keras variable. + + Args: + variable: The variable to update. + value: The value to add to the variable. + """ + variable.assign_add(value) + + def assign_sub(self, variable, value): + """Subtract a value from a variable. + + This should be used in optimizers instead of + `variable.assign_sub(value)` to support backend specific optimizations. + Note that the variable can be a model variable or an optimizer variable; + it can be a backend native variable or a Keras variable. + + Args: + variable: The variable to update. + value: The value to add to the variable. + """ + variable.assign_sub(value) + + def update_step(self, gradient, variable, learning_rate): + raise NotImplementedError + + def apply_gradients(self, grads_and_vars): + grads, trainable_variables = zip(*grads_and_vars) + self.apply(grads, trainable_variables) + # Return iterations for compat with tf.keras. + return self._iterations + + def apply(self, grads, trainable_variables=None): + """Update traininable variables according to provided gradient values. + + `grads` should be a list of gradient tensors + with 1:1 mapping to the list of variables the optimizer was built with. + + `trainable_variables` can be provided + on the first call to build the optimizer. + """ + if len(grads) == 0: + # It is possible that the grad is empty. In this case, + # `apply_gradients` is a no-op. + return + + if trainable_variables is None: + if not self.built: + raise ValueError( + "When passing `grads` without `variables`, the optimizer " + "must already be built on a list of variables. " + "Call `optimizer.build(trainable_variables)` first. 
" + ) + if len(grads) != len(self._trainable_variables_indices): + raise ValueError( + "When passing `grads` as a list of gradient tensors, the " + f"gradients must match `optimizer.variables` one-to-on. " + f"Received a list of {len(grads)} gradients, but the " + f"optimizer is tracking {len(self._trainable_variables)} " + "trainable variables." + ) + trainable_variables = self._trainable_variables + else: + trainable_variables = list(trainable_variables) + # Optionally build optimizer. + if not self.built: + with backend.name_scope(self.name, caller=self): + self.build(trainable_variables) + self.built = True + self._check_variables_are_known(trainable_variables) + + with backend.name_scope(self.name, caller=self): + # Overwrite targeted variables directly with their gradients if + # their `overwrite_with_gradient` is set. + grads, trainable_variables = ( + self._overwrite_variables_directly_with_gradients( + grads, trainable_variables + ) + ) + + # Filter empty gradients. + grads, trainable_variables = self._filter_empty_gradients( + grads, trainable_variables + ) + if len(list(grads)) == 0: + return + + # Unscale gradients. + scale = self.loss_scale_factor + if scale is not None: + grads = [g if g is None else g / scale for g in grads] + + # Apply gradient updates. + self._backend_apply_gradients(grads, trainable_variables) + # Apply variable constraints after applying gradients. + for variable in trainable_variables: + if variable.constraint is not None: + variable.assign(variable.constraint(variable)) + + def _backend_apply_gradients(self, grads, trainable_variables): + """Apply method that can be overridden by different backends. + + JAX overrides it in order to deal with statelessness in gradient + accumulation and EMA handling. + + The below implementation is intended to be generally backend-agnostic, + but may not work with all backends. 
+ + This method does 4 things: + - Call the optimizer's update_step() to update trainable variables + and optimizer variables. + - Update EMA variables, if EMA is configured. + - Update gradient accumulators, if gradient accumulation is configured. + - Update the iteration counter. + """ + if self.gradient_accumulation_steps: + is_update_step = ( + self._iterations + 1 + ) % self.gradient_accumulation_steps == 0 + # `trainable_variables` might have been filtered in previous + # processing steps, so we need to ensure the correct mapping between + # `self._accumulated_gradients` and `trainable_variables` + acc_grads = [ + self._accumulated_gradients[self._get_variable_index(v)] + for v in trainable_variables + ] + + def _update_step_fn(grads, trainable_variables): + # Run update step with accumulated grads + reset accumulators + steps = self.gradient_accumulation_steps + grads = [ + (g + acc_g) / steps for g, acc_g in zip(grads, acc_grads) + ] + + # Apply clipping and weight decay. + grads = self._clip_gradients(grads) + self._apply_weight_decay(trainable_variables) + + self._backend_update_step( + grads, trainable_variables, self.learning_rate + ) + self._backend_reset_gradient_accumulators() + + ops.cond( + is_update_step, + lambda: _update_step_fn(grads, trainable_variables), + lambda: self._backend_increment_gradient_accumulators( + grads, acc_grads + ), + ) + else: + # Apply clipping and weight decay. + grads = self._clip_gradients(grads) + self._apply_weight_decay(trainable_variables) + + # Run update step. + self._backend_update_step( + grads, trainable_variables, self.learning_rate + ) + + if self.use_ema: + self._update_model_variables_moving_average( + self._trainable_variables + ) + if self.ema_overwrite_frequency: + # Only when self.ema_overwrite_frequency is not None, we + # overwrite the model variables. 
+ should_overwrite_model_vars = ( + self.iterations + 1 + ) % self.ema_overwrite_frequency == 0 + ops.cond( + should_overwrite_model_vars, + lambda: self._overwrite_model_variables_with_average_value( + self._trainable_variables + ), + lambda: None, + ) + # Update iteration counter. + self._iterations.assign_add(1) + + def _backend_update_step(self, grads, trainable_variables, learning_rate): + """Collective update_step that can be overridden by the backend. + + It is overridden by torch for performance reasons, and + by TF to support tf.distribute. + """ + for grad, var in zip(grads, trainable_variables): + self.update_step(grad, var, learning_rate) + + def _backend_reset_gradient_accumulators(self): + for g_acc in self._accumulated_gradients: + g_acc.assign(ops.zeros(g_acc.shape, dtype=g_acc.dtype)) + + def _backend_increment_gradient_accumulators(self, grads, acc_grads): + new_g_accs = [(g + acc_g) for g, acc_g in zip(grads, acc_grads)] + for n_g_acc, g_acc in zip(new_g_accs, acc_grads): + g_acc.assign(n_g_acc) + + def stateless_apply(self, optimizer_variables, grads, trainable_variables): + self._check_super_called() + + if not self.built: + raise ValueError( + f"To call `stateless_apply`, {self.__class__.__name__} " + "must be built (i.e. its variables must have been created). " + "You can build it via `optimizer.build(trainable_variables)`." + ) + if len(optimizer_variables) != len(self.variables): + raise ValueError( + "Argument `optimizer_variables` must be a list of tensors " + f"corresponding 1:1 to {self.__class__.__name__}().variables. " + f"Received list with length {len(optimizer_variables)}, but " + f"expected {len(self.variables)} variables." + ) + if len(trainable_variables) != len(self._trainable_variables): + raise ValueError( + "Argument `optimizer_variables` must be a list of tensors " + "corresponding 1:1 to the trainable variables list that " + "the optimizer was built with. 
Received " + f"len(trainable_variables) == {len(trainable_variables)} " + "whereas the optimizer was built with " + f"{len(self._trainable_variables)} variables." + ) + + # Gather variable mapping + mapping = list( + zip(self._trainable_variables, trainable_variables) + ) + list(zip(self.variables, optimizer_variables)) + + # Call in stateless scope + with backend.StatelessScope(state_mapping=mapping) as scope: + self.apply(grads) + + # Gather updated variables + trainable_variables = [] + for v in self._trainable_variables: + new_v = scope.get_current_value(v) + if new_v is not None: + trainable_variables.append(new_v) + else: + trainable_variables.append(v) + optimizer_variables = [] + for v in self.variables: + new_v = scope.get_current_value(v) + if new_v is not None: + optimizer_variables.append(new_v) + else: + optimizer_variables.append(v) + return trainable_variables, optimizer_variables + + def scale_loss(self, loss): + """Scale the loss before computing gradients. + + Scales the loss before gradients are computed in a `train_step`. This + is primarily useful during mixed precision training to prevent numeric + underflow. + """ + if self.loss_scale_factor is not None: + return loss * self.loss_scale_factor + return loss + + @property + def learning_rate(self): + return self._get_current_learning_rate() + + @learning_rate.setter + def learning_rate(self, learning_rate): + if isinstance(self._learning_rate, backend.Variable): + prev_lr_var = self._learning_rate + else: + prev_lr_var = None + if isinstance( + learning_rate, learning_rate_schedule.LearningRateSchedule + ): + self._learning_rate = learning_rate + elif callable(learning_rate): + self._learning_rate = learning_rate + else: + if isinstance( + self._learning_rate, learning_rate_schedule.LearningRateSchedule + ): + raise TypeError( + "This optimizer was created with a `LearningRateSchedule`" + " object as its `learning_rate` constructor argument, " + "hence its learning rate is not settable. 
If you need the" + " learning rate to be settable, you should instantiate " + "the optimizer with a float `learning_rate` argument." + ) + self._learning_rate.assign(learning_rate) + if prev_lr_var is not None and not isinstance( + self._learning_rate, backend.Variable + ): + # Untrack learning rate variable + self._untrack_variable(prev_lr_var) + + def set_weights(self, weights): + """Set the weights of the optimizer.""" + if not self.built: + raise ValueError( + "You are calling `set_weights()` on an optimizer that has not " + "yet been built. Please call " + "`optimizer.build(trainable_variables)` to create the " + "optimizer weights before calling `set_weights()`." + ) + for variable, weight in zip(self._variables, weights): + if variable.shape != weight.shape: + raise ValueError( + f"Optimizer variable {self._var_key(variable)} has shape " + f"{str(variable.shape)} not compatible with provided " + f"weight shape {str(weight.shape)}." + ) + variable.assign(weight) + + def save_own_variables(self, store): + """Get the state of this optimizer object.""" + for i, variable in enumerate(self.variables): + store[str(i)] = variable.numpy() + + def load_own_variables(self, store): + """Set the state of this optimizer object.""" + if len(store.keys()) != len(self.variables): + msg = ( + f"Skipping variable loading for optimizer '{self.name}', " + f"because it has {len(self.variables)} variables whereas " + f"the saved optimizer has {len(store.keys())} variables. " + ) + if len(self.variables) == 0: + msg += ( + "This is likely because the optimizer has not been " + "called/built yet." 
+ ) + warnings.warn(msg, stacklevel=2) + return + for i, variable in enumerate(self.variables): + variable.assign(store[str(i)]) + + def _get_current_learning_rate(self): + if isinstance( + self._learning_rate, learning_rate_schedule.LearningRateSchedule + ): + return self._learning_rate(self._iterations) + elif callable(self._learning_rate): + return self._learning_rate() + return self._learning_rate + + def _overwrite_variables_directly_with_gradients(self, grads, vars): + """Overwrite the variables directly by their gradients. + + This method is designed for a special case where we want to overwrite + the variable directly with its computed gradient. For example, in float8 + training, new `scale` and `amax_history` are computed as gradients, and + we want to overwrite them directly instead of following the typical + procedure such as gradient descent with a learning rate, gradient + clipping and weight decaying. + + After the update, the processed pairs will be filtered out. + """ + # Shortcut for `tf.Variable` because it doesn't have a + # `overwrite_with_gradient` attr + if any(not hasattr(v, "overwrite_with_gradient") for v in vars): + return grads, vars + + # Shallow copies + filtered_grads = list(grads) + filtered_vars = list(vars) + + # Iterate from right to left for safe popping + for i in range(len(filtered_grads) - 1, -1, -1): + g, v = filtered_grads[i], filtered_vars[i] + if v.overwrite_with_gradient: + if self.gradient_accumulation_steps: + # Utilize a stateless manner for JAX compatibility + steps = self.gradient_accumulation_steps + is_update_step = (self._iterations + 1) % steps == 0 + acc_g = self._accumulated_gradients[ + self._get_variable_index(v) + ] + # `ops.maximum` is utilized for gradient accumulation for + # `overwrite_with_gradient=True` variables + new_g_acc = ops.cond( + is_update_step, + lambda: ops.zeros(g.shape, dtype=g.dtype), + lambda: ops.maximum(g, acc_g), + ) + new_g = ops.cond( + is_update_step, + lambda: ops.maximum(g, 
acc_g), + lambda: g, + ) + new_v = ops.cond( + is_update_step, lambda: new_g, lambda: v.value + ) + v.assign(new_v) + acc_g.assign(new_g_acc) + else: + v.assign(g) + filtered_grads.pop(i) + filtered_vars.pop(i) + return filtered_grads, filtered_vars + + def _filter_empty_gradients(self, grads, vars): + filtered_grads = list(grads) + filtered_vars = list(vars) + missing_grad_vars = [] + + # Iterate from right to left for safe popping + for i in range(len(filtered_grads) - 1, -1, -1): + if filtered_grads[i] is None: + filtered_grads.pop(i) + v = filtered_vars.pop(i) + try: + missing_grad_vars.append(v.path) + except AttributeError: + # `tf.Variable` doesn't have `path` attr. + missing_grad_vars.append(v.name) + + if not filtered_grads: + raise ValueError("No gradients provided for any variable.") + if missing_grad_vars: + warnings.warn( + "Gradients do not exist for variables " + f"{list(reversed(missing_grad_vars))} when minimizing the loss." + " If using `model.compile()`, did you forget to provide a " + "`loss` argument?" + ) + return filtered_grads, filtered_vars + + def _clip_gradients(self, grads): + if self.clipnorm and self.clipnorm > 0: + return [ + self._clip_by_norm(g) if g is not None else g for g in grads + ] + elif self.global_clipnorm and self.global_clipnorm > 0: + return clip_by_global_norm(grads, self.global_clipnorm) + elif self.clipvalue and self.clipvalue > 0: + v = self.clipvalue + return [ops.clip(g, -v, v) if g is not None else g for g in grads] + else: + return grads + + def exclude_from_weight_decay(self, var_list=None, var_names=None): + """Exclude variables from weight decay. + + This method must be called before the optimizer's `build` method is + called. You can set specific variables to exclude out, or set a list of + strings as the anchor words, if any of which appear in a variable's + name, then the variable is excluded. + + Args: + var_list: A list of `Variable`s to exclude from weight decay. + var_names: A list of strings. 
If any string in `var_names` appear + in the model variable's name, then this model variable is + excluded from weight decay. For example, `var_names=['bias']` + excludes all bias variables from weight decay. + """ + if hasattr(self, "_built") and self._built: + raise ValueError( + "`exclude_from_weight_decay()` can only be configured before " + "the optimizer is built." + ) + + # Use a `set` for the ids of `var_list` to speed up the searching + if var_list: + self._exclude_from_weight_decay = set( + self._var_key(variable) for variable in var_list + ) + else: + self._exclude_from_weight_decay = set() + + # Precompile the pattern for `var_names` to speed up the searching + if var_names and len(var_names) > 0: + self._exclude_from_weight_decay_pattern = re.compile( + "|".join(set(var_names)) + ) + else: + self._exclude_from_weight_decay_pattern = None + + # Reset cache + self._exclude_from_weight_decay_cache = dict() + + def _use_weight_decay(self, variable): + variable_id = self._var_key(variable) + + # Immediately return the value if `variable_id` hits the cache + if not hasattr(self, "_exclude_from_weight_decay_cache"): + self._exclude_from_weight_decay_cache = dict() + if variable_id in self._exclude_from_weight_decay_cache: + return self._exclude_from_weight_decay_cache[variable_id] + + # Determine whether the variable should apply weight decay or not + exclude_from_weight_decay = getattr( + self, "_exclude_from_weight_decay", set() + ) + exclude_from_weight_decay_pattern = getattr( + self, "_exclude_from_weight_decay_pattern", None + ) + if variable_id in exclude_from_weight_decay: + self._exclude_from_weight_decay_cache[variable_id] = False + return False + if exclude_from_weight_decay_pattern is not None: + if ( + re.search(exclude_from_weight_decay_pattern, variable.name) + is not None + ): + self._exclude_from_weight_decay_cache[variable_id] = False + return False + self._exclude_from_weight_decay_cache[variable_id] = True + return True + + def 
_apply_weight_decay(self, variables): + if self.weight_decay is None: + return + for variable in variables: + if self._use_weight_decay(variable): + lr = ops.cast(self.learning_rate, variable.dtype) + wd = ops.cast(self.weight_decay, variable.dtype) + variable.assign(variable - variable * wd * lr) + + def _check_super_called(self): + if not hasattr(self, "_lock"): + raise RuntimeError( + f"In optimizer '{self.__class__.__name__}', you forgot to call " + "`super().__init__()` as the first statement " + "in the `__init__()` method. " + "Go add it!" + ) + + def _update_model_variables_moving_average(self, trainable_variables): + """Update the stored moving average using the latest value.""" + if self.use_ema: + for var, average in zip( + trainable_variables, self._model_variables_moving_average + ): + not_first_step = ops.not_equal(self.iterations, 0) + momentum = ( + ops.cast(not_first_step, var.dtype) * self.ema_momentum + ) + average.assign(momentum * average + (1 - momentum) * var) + + def _overwrite_model_variables_with_average_value( + self, trainable_variables + ): + """Overwrite model variables with its moving average.""" + if len(trainable_variables) != len( + self._model_variables_moving_average + ): + raise ValueError( + f"The length of model variables ({len(trainable_variables)}) " + "to override does not match the length of model variables " + "stored in the optimizer " + f"({len(self._model_variables_moving_average)}). Please " + "check if the optimizer was called on your model." + ) + for var, average_var in zip( + trainable_variables, self._model_variables_moving_average + ): + var.assign(average_var) + + def finalize_variable_values(self, var_list): + """Set the final value of model's trainable variables. + + Sometimes there are some extra steps before ending the variable updates, + such as overriding the model variables with its average value. + + Args: + var_list: list of model variables. 
+ """ + if self.use_ema: + # If the optimizer uses EMA, then when finalizing, we replace the + # model variable value with its moving average stored inside + # optimizer. + self._overwrite_model_variables_with_average_value(var_list) + + def _obj_type(self): + return "Optimizer" + + def get_config(self): + """Returns the config of the optimizer. + + An optimizer config is a Python dictionary (serializable) + containing the configuration of an optimizer. + The same optimizer can be reinstantiated later + (without any saved state) from this configuration. + + Subclass optimizer should override this method to include other + hyperparameters. + + Returns: + Python dictionary. + """ + + if isinstance( + self._learning_rate, learning_rate_schedule.LearningRateSchedule + ): + learning_rate = learning_rate_schedule.serialize( + self._learning_rate + ) + elif isinstance(self._learning_rate, backend.Variable): + learning_rate = float(self._learning_rate.numpy()) + elif ops.is_tensor(self._learning_rate): + learning_rate = float(self._learning_rate) + elif callable(self._learning_rate): + learning_rate = serialization_lib.serialize_keras_object( + self._learning_rate + ) + else: + learning_rate = 0.5 + + config = { + "name": self.name, + "learning_rate": learning_rate, + "weight_decay": self.weight_decay, + "clipnorm": self.clipnorm, + "global_clipnorm": self.global_clipnorm, + "clipvalue": self.clipvalue, + "use_ema": self.use_ema, + "ema_momentum": self.ema_momentum, + "ema_overwrite_frequency": self.ema_overwrite_frequency, + "loss_scale_factor": self.loss_scale_factor, + "gradient_accumulation_steps": self.gradient_accumulation_steps, + } + return config + + @classmethod + def from_config(cls, config, custom_objects=None): + """Creates an optimizer from its config. + + This method is the reverse of `get_config`, capable of instantiating the + same optimizer from the config dictionary. + + Args: + config: A Python dictionary, typically the output of get_config. 
+ custom_objects: A Python dictionary mapping names to additional + user-defined Python objects needed to recreate this optimizer. + + Returns: + An optimizer instance. + """ + if "learning_rate" in config: + if isinstance(config["learning_rate"], dict): + config["learning_rate"] = ( + serialization_lib.deserialize_keras_object( + config["learning_rate"], custom_objects=custom_objects + ) + ) + return cls(**config) + + def __setattr__(self, name, value): + # Prevent users from attaching state to the + # layer before `super()` is called -- since that + # state would silently not be tracked. + if name != "_lock": + self._check_super_called() + # Track Variables. + if hasattr(self, "_tracker"): + value = self._tracker.track(value) + return super().__setattr__(name, value) + + def _clip_by_norm(self, values, axes=None): + # Calculate L2-norm, clip elements by ratio of clip_norm to L2-norm + l2sum = ops.sum(ops.square(values), axes, keepdims=True) + pred = l2sum > 0 + # Two-tap tf.where trick to bypass NaN gradients + l2sum_safe = ops.where(pred, l2sum, ops.ones_like(l2sum)) + l2norm = ops.where(pred, ops.sqrt(l2sum_safe), l2sum) + intermediate = ops.multiply(values, self.clipnorm) + values_clip = ops.convert_to_tensor(intermediate) / ops.maximum( + l2norm, self.clipnorm + ) + return values_clip + + def _untrack_variable(self, variable): + previous_lock_state = self._tracker.locked + self._tracker.unlock() + self._tracker.untrack(variable) + if previous_lock_state is True: + self._tracker.lock() + + +base_optimizer_keyword_args = """name: String. The name to use + for momentum accumulator weights created by + the optimizer. + weight_decay: Float. If set, weight decay is applied. + clipnorm: Float. If set, the gradient of each weight is individually + clipped so that its norm is no higher than this value. + clipvalue: Float. If set, the gradient of each weight is clipped to be + no higher than this value. + global_clipnorm: Float. 
If set, the gradient of all weights is clipped + so that their global norm is no higher than this value. + use_ema: Boolean, defaults to `False`. + If `True`, exponential moving average + (EMA) is applied. EMA consists of computing an exponential moving + average of the weights of the model (as the weight values change + after each training batch), and periodically overwriting the + weights with their moving average. + ema_momentum: Float, defaults to 0.99. Only used if `use_ema=True`. + This is the momentum to use when computing + the EMA of the model's weights: + `new_average = ema_momentum * old_average + (1 - ema_momentum) * + current_variable_value`. + ema_overwrite_frequency: Int or None, defaults to None. Only used if + `use_ema=True`. Every `ema_overwrite_frequency` steps of iterations, + we overwrite the model variable by its moving average. + If None, the optimizer + does not overwrite model variables in the middle of training, + and you need to explicitly overwrite the variables + at the end of training by calling + `optimizer.finalize_variable_values()` (which updates the model + variables in-place). When using the built-in `fit()` training loop, + this happens automatically after the last epoch, + and you don't need to do anything. + loss_scale_factor: Float or `None`. If a float, the scale factor will + be multiplied the loss before computing gradients, and the inverse + of the scale factor will be multiplied by the gradients before + updating variables. Useful for preventing underflow during + mixed precision training. Alternately, + `keras.optimizers.LossScaleOptimizer` will + automatically set a loss scale factor. + gradient_accumulation_steps: Int or `None`. If an int, model & optimizer + variables will not be updated at every step; instead they will be + updated every `gradient_accumulation_steps` steps, using the average + value of the gradients since the last update. This is known as + "gradient accumulation". 
This can be useful + when your batch size is very small, in order to reduce gradient + noise at each update step. EMA frequency will look at "accumulated" + iterations value (optimizer steps // gradient_accumulation_steps). + Learning rate schedules will look at "real" iterations value + (optimizer steps). +""" + + +def global_norm(value_list): + """Computes the global norm of multiple tensors.""" + squared_norms = [ + ops.sum(ops.square(v)) for v in value_list if v is not None + ] + squared_norm = ops.sum(ops.stack(squared_norms)) + return ops.sqrt(squared_norm) + + +def clip_by_global_norm(value_list, clip_norm): + use_norm = global_norm(value_list) + # Calculate L2-norm, clip elements by ratio of clip_norm to L2-norm + scale_for_finite = clip_norm * ops.minimum(1.0 / use_norm, 1.0 / clip_norm) + # If use_norm is any finite number, this is a no-op. For inf/-inf/NaN, + # this will make scale NaN. + scale = scale_for_finite + (use_norm - use_norm) + return [v * scale if v is not None else v for v in value_list] diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/ftrl.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/ftrl.py new file mode 100644 index 0000000000000000000000000000000000000000..562e2ec03a0806c98ba47a30d2a834eb367cea22 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/ftrl.py @@ -0,0 +1,249 @@ +from keras.src import initializers +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export(["keras.optimizers.Ftrl"]) +class Ftrl(optimizer.Optimizer): + r"""Optimizer that implements the FTRL algorithm. + + "Follow The Regularized Leader" (FTRL) is an optimization algorithm + developed at Google for click-through rate prediction in the early 2010s. It + is most suitable for shallow models with large and sparse feature spaces. 
+ The algorithm is described by + [McMahan et al., 2013](https://research.google.com/pubs/archive/41159.pdf). + The Keras version has support for both online L2 regularization + (the L2 regularization described in the paper + above) and shrinkage-type L2 regularization + (which is the addition of an L2 penalty to the loss function). + + Initialization: + + ```python + n = 0 + sigma = 0 + z = 0 + ``` + + Update rule for one variable `w`: + + ```python + prev_n = n + n = n + g ** 2 + sigma = (n ** -lr_power - prev_n ** -lr_power) / lr + z = z + g - sigma * w + if abs(z) < lambda_1: + w = 0 + else: + w = (sgn(z) * lambda_1 - z) / ((beta + sqrt(n)) / alpha + lambda_2) + ``` + + Notation: + + - `lr` is the learning rate + - `g` is the gradient for the variable + - `lambda_1` is the L1 regularization strength + - `lambda_2` is the L2 regularization strength + - `lr_power` is the power to scale n. + + Check the documentation for the `l2_shrinkage_regularization_strength` + parameter for more details when shrinkage is enabled, in which case gradient + is replaced with a gradient with shrinkage. + + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. + learning_rate_power: A float value, must be less or equal to zero. + Controls how the learning rate decreases during training. Use zero + for a fixed learning rate. + initial_accumulator_value: The starting value for accumulators. Only + zero or positive values are allowed. + l1_regularization_strength: A float value, must be greater than or equal + to zero. Defaults to `0.0`. + l2_regularization_strength: A float value, must be greater than or equal + to zero. Defaults to `0.0`. + l2_shrinkage_regularization_strength: A float value, must be greater + than or equal to zero. 
This differs from L2 above in that the L2 + above is a stabilization penalty, whereas this L2 shrinkage is a + magnitude penalty. When input is sparse shrinkage will only happen + on the active weights. + beta: A float value, representing the beta value from the paper. + Defaults to `0.0`. + {{base_optimizer_keyword_args}} + """ + + def __init__( + self, + learning_rate=0.001, + learning_rate_power=-0.5, + initial_accumulator_value=0.1, + l1_regularization_strength=0.0, + l2_regularization_strength=0.0, + l2_shrinkage_regularization_strength=0.0, + beta=0.0, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="ftrl", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + name=name, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + **kwargs, + ) + + if initial_accumulator_value < 0.0: + raise ValueError( + "`initial_accumulator_value` needs to be positive or zero. " + "Received: initial_accumulator_value=" + f"{initial_accumulator_value}." + ) + if learning_rate_power > 0.0: + raise ValueError( + "`learning_rate_power` needs to be negative or zero. Received: " + f"learning_rate_power={learning_rate_power}." + ) + if l1_regularization_strength < 0.0: + raise ValueError( + "`l1_regularization_strength` needs to be positive or zero. " + "Received: l1_regularization_strength=" + f"{l1_regularization_strength}." + ) + if l2_regularization_strength < 0.0: + raise ValueError( + "`l2_regularization_strength` needs to be positive or zero. " + "Received: l2_regularization_strength=" + f"{l2_regularization_strength}." 
+ ) + if l2_shrinkage_regularization_strength < 0.0: + raise ValueError( + "`l2_shrinkage_regularization_strength` needs to be positive " + "or zero. Received: l2_shrinkage_regularization_strength" + f"={l2_shrinkage_regularization_strength}." + ) + + self.learning_rate_power = learning_rate_power + self.initial_accumulator_value = initial_accumulator_value + self.l1_regularization_strength = l1_regularization_strength + self.l2_regularization_strength = l2_regularization_strength + self.l2_shrinkage_regularization_strength = ( + l2_shrinkage_regularization_strength + ) + self.beta = beta + + def build(self, var_list): + """Initialize optimizer variables. + + Args: + var_list: list of model variables to build Ftrl variables on. + """ + if self.built: + return + super().build(var_list) + self._accumulators = [] + self._linears = [] + for var in var_list: + self._accumulators.append( + self.add_variable( + shape=var.shape, + dtype=var.dtype, + name="accumulator", + initializer=initializers.Constant( + self.initial_accumulator_value, + ), + ) + ) + self._linears.append( + self.add_variable_from_reference( + reference_variable=var, name="linear" + ) + ) + + def update_step(self, gradient, variable, learning_rate): + """Update step given gradient and the associated model variable.""" + + lr = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + + accum = self._accumulators[self._get_variable_index(variable)] + linear = self._linears[self._get_variable_index(variable)] + + lr_power = self.learning_rate_power + l2_reg = self.l2_regularization_strength + l2_reg = l2_reg + self.beta / (2.0 * lr) + + grad_to_use = ops.add( + gradient, + ops.multiply( + 2 * self.l2_shrinkage_regularization_strength, variable + ), + ) + new_accum = ops.add(accum, ops.square(gradient)) + self.assign_add( + linear, + ops.subtract( + grad_to_use, + ops.multiply( + ops.divide( + ops.subtract( + ops.power(new_accum, -lr_power), + ops.power(accum, -lr_power), + 
), + lr, + ), + variable, + ), + ), + ) + quadratic = ops.add( + ops.divide(ops.power(new_accum, (-lr_power)), lr), 2 * l2_reg + ) + linear_clipped = ops.clip( + linear, + -self.l1_regularization_strength, + self.l1_regularization_strength, + ) + self.assign( + variable, + ops.divide(ops.subtract(linear_clipped, linear), quadratic), + ) + self.assign(accum, new_accum) + + def get_config(self): + config = super().get_config() + + config.update( + { + "learning_rate_power": self.learning_rate_power, + "initial_accumulator_value": self.initial_accumulator_value, + "l1_regularization_strength": self.l1_regularization_strength, + "l2_regularization_strength": self.l2_regularization_strength, + "l2_shrinkage_regularization_strength": self.l2_shrinkage_regularization_strength, # noqa: E501 + "beta": self.beta, + } + ) + return config + + +Ftrl.__doc__ = Ftrl.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/lamb.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/lamb.py new file mode 100644 index 0000000000000000000000000000000000000000..d79f4109734b1fa73f4f7e09c1eed6b40675f117 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/lamb.py @@ -0,0 +1,158 @@ +from keras.src import ops +from keras.src.api_export import keras_export +from keras.src.optimizers import optimizer + + +@keras_export("keras.optimizers.Lamb") +class Lamb(optimizer.Optimizer): + """Optimizer that implements the Lamb algorithm. + + Lamb is a stochastic gradient descent method that + uses layer-wise adaptive moments to adjusts the + learning rate for each parameter based on the ratio of the + norm of the weight to the norm of the gradient + This helps to stabilize the training process and improves convergence + especially for large batch sizes. 
+ + Args: + learning_rate: A float, a + `keras.optimizers.schedules.LearningRateSchedule` instance, or + a callable that takes no arguments and returns the actual value to + use. The learning rate. Defaults to `0.001`. + beta_1: A float value or a constant float tensor, or a callable + that takes no arguments and returns the actual value to use. The + exponential decay rate for the 1st moment estimates. Defaults to + `0.9`. + beta_2: A float value or a constant float tensor, or a callable + that takes no arguments and returns the actual value to use. The + exponential decay rate for the 2nd moment estimates. Defaults to + `0.999`. + epsilon: A small constant for numerical stability. + Defaults to `1e-7`. + {{base_optimizer_keyword_args}} + + References: + - [Yang et al.](https://arxiv.org/pdf/1904.00962) + """ + + def __init__( + self, + learning_rate=0.001, + beta_1=0.9, + beta_2=0.999, + epsilon=1e-7, + weight_decay=None, + clipnorm=None, + clipvalue=None, + global_clipnorm=None, + use_ema=False, + ema_momentum=0.99, + ema_overwrite_frequency=None, + loss_scale_factor=None, + gradient_accumulation_steps=None, + name="lamb", + **kwargs, + ): + super().__init__( + learning_rate=learning_rate, + name=name, + weight_decay=weight_decay, + clipnorm=clipnorm, + clipvalue=clipvalue, + global_clipnorm=global_clipnorm, + use_ema=use_ema, + ema_momentum=ema_momentum, + ema_overwrite_frequency=ema_overwrite_frequency, + loss_scale_factor=loss_scale_factor, + gradient_accumulation_steps=gradient_accumulation_steps, + **kwargs, + ) + self.beta_1 = beta_1 + self.beta_2 = beta_2 + self.epsilon = epsilon + + def build(self, var_list): + """Initialize optimizer variables. + + Lamb optimizer has 2 types of variables: momentums and velocities + + Args: + var_list: list of model variables to build Lamb variables on. 
+ """ + if self.built: + return + super().build(var_list) + self._momentums = [] + self._velocities = [] + for var in var_list: + self._momentums.append( + self.add_variable_from_reference( + reference_variable=var, name="momentum" + ) + ) + self._velocities.append( + self.add_variable_from_reference( + reference_variable=var, name="velocity" + ) + ) + + def update_step(self, gradient, variable, learning_rate): + """Update step given gradient and the associated model variable.""" + lr = ops.cast(learning_rate, variable.dtype) + gradient = ops.cast(gradient, variable.dtype) + local_step = ops.cast(self.iterations + 1, variable.dtype) + + beta_1_power = ops.power( + ops.cast(self.beta_1, variable.dtype), local_step + ) + beta_2_power = ops.power( + ops.cast(self.beta_2, variable.dtype), local_step + ) + + m = self._momentums[self._get_variable_index(variable)] + v = self._velocities[self._get_variable_index(variable)] + + self.assign_add( + m, ops.multiply(ops.subtract(gradient, m), 1 - self.beta_1) + ) + + self.assign_add( + v, + ops.multiply( + ops.subtract(ops.square(gradient), v), 1 - self.beta_2 + ), + ) + + m_t_hat = ops.divide(m, (1.0 - beta_1_power)) + v_sqrt = ops.add( + ops.sqrt(ops.divide(v, (1.0 - beta_2_power))), self.epsilon + ) + + update = ops.divide(m_t_hat, v_sqrt) + w_norm = ops.sqrt(ops.sum(ops.power(variable, 2))) + g_norm = ops.sqrt(ops.sum(ops.power(update, 2))) + + # ratio = w_norm / g_norm if w_norm > 0 and g_norm > 0 else 1 + ratio = ops.where( + ops.greater(w_norm, 0), + ops.where(ops.greater(g_norm, 0), (w_norm / g_norm), 1.0), + 1.0, + ) + + self.assign_sub(variable, ratio * lr * update) + + def get_config(self): + config = super().get_config() + config.update( + { + "beta_1": self.beta_1, + "beta_2": self.beta_2, + "epsilon": self.epsilon, + } + ) + return config + + +Lamb.__doc__ = Lamb.__doc__.replace( + "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args +) diff --git 
from keras.src import ops
from keras.src.api_export import keras_export
from keras.src.optimizers import optimizer


@keras_export(["keras.optimizers.Lion"])
class Lion(optimizer.Optimizer):
    """Optimizer that implements the Lion algorithm.

    The Lion optimizer is a stochastic-gradient-descent method that uses the
    sign operator to control the magnitude of the update, unlike other
    adaptive optimizers such as Adam that rely on second-order moments. This
    makes Lion more memory-efficient as it only keeps track of the momentum.
    According to the authors (see reference), its performance gain over Adam
    grows with the batch size. Because the update of Lion is produced through
    the sign operation, resulting in a larger norm, a suitable learning rate
    for Lion is typically 3-10x smaller than that for AdamW. The weight decay
    for Lion should be in turn 3-10x larger than that for AdamW to maintain a
    similar strength (lr * wd).

    Args:
        learning_rate: A float, a
            `keras.optimizers.schedules.LearningRateSchedule` instance, or
            a callable that takes no arguments and returns the actual value to
            use. The learning rate. Defaults to `0.001`.
        beta_1: A float value or a constant float tensor, or a callable
            that takes no arguments and returns the actual value to use. The
            rate to combine the current gradient and the 1st moment estimate.
            Must be in the `(0, 1]` range. Defaults to `0.9`.
        beta_2: A float value or a constant float tensor, or a callable
            that takes no arguments and returns the actual value to use. The
            exponential decay rate for the 1st moment estimate.
            Defaults to `0.99`.
        {{base_optimizer_keyword_args}}

    References:

    - [Chen et al., 2023](http://arxiv.org/abs/2302.06675)
    - [Authors' implementation](
        http://github.com/google/automl/tree/master/lion)

    """

    def __init__(
        self,
        learning_rate=0.001,
        beta_1=0.9,
        beta_2=0.99,
        weight_decay=None,
        clipnorm=None,
        clipvalue=None,
        global_clipnorm=None,
        use_ema=False,
        ema_momentum=0.99,
        ema_overwrite_frequency=None,
        loss_scale_factor=None,
        gradient_accumulation_steps=None,
        name="lion",
        **kwargs,
    ):
        # Validate hyperparameters before any base-class setup so invalid
        # arguments fail fast without building optimizer state. Note the
        # condition rejects beta_1 == 0 (the update would reduce to
        # SignSGD), so the valid range is the half-open interval (0, 1].
        if beta_1 <= 0 or beta_1 > 1:
            raise ValueError(
                "Argument `beta_1` must be in the (0, 1] range. Otherwise, "
                f"the optimizer degenerates to SignSGD. Received: "
                f"beta_1={beta_1}."
            )
        super().__init__(
            learning_rate=learning_rate,
            name=name,
            weight_decay=weight_decay,
            clipnorm=clipnorm,
            clipvalue=clipvalue,
            global_clipnorm=global_clipnorm,
            use_ema=use_ema,
            ema_momentum=ema_momentum,
            ema_overwrite_frequency=ema_overwrite_frequency,
            loss_scale_factor=loss_scale_factor,
            gradient_accumulation_steps=gradient_accumulation_steps,
            **kwargs,
        )
        self.beta_1 = beta_1
        self.beta_2 = beta_2

    def build(self, var_list):
        """Initialize optimizer variables.

        Lion optimizer has one variable `momentums` (one slot per model
        variable).

        Args:
            var_list: list of model variables to build Lion variables on.
        """
        if self.built:
            return
        super().build(var_list)
        self._momentums = []
        for var in var_list:
            self._momentums.append(
                self.add_variable_from_reference(
                    reference_variable=var, name="momentum"
                )
            )

    def update_step(self, gradient, variable, learning_rate):
        """Update step given gradient and the associated model variable."""
        lr = ops.cast(learning_rate, variable.dtype)
        gradient = ops.cast(gradient, variable.dtype)
        beta_1 = ops.cast(self.beta_1, variable.dtype)
        beta_2 = ops.cast(self.beta_2, variable.dtype)
        m = self._momentums[self._get_variable_index(variable)]

        # Variable update: w <- w - lr * sign(beta_1 * m + (1 - beta_1) * g).
        # The sign() is what bounds the per-coordinate update magnitude.
        self.assign_sub(
            variable,
            ops.multiply(
                lr,
                ops.sign(
                    ops.add(
                        ops.multiply(m, beta_1),
                        ops.multiply(gradient, (1.0 - beta_1)),
                    )
                ),
            ),
        )
        # Momentum update (after the variable update, per the Lion paper):
        # m <- beta_2 * m + (1 - beta_2) * g.
        self.assign(
            m,
            ops.add(
                ops.multiply(m, beta_2), ops.multiply(gradient, (1.0 - beta_2))
            ),
        )

    def get_config(self):
        """Return the optimizer configuration (adds `beta_1`/`beta_2`)."""
        config = super().get_config()
        config.update(
            {
                "beta_1": self.beta_1,
                "beta_2": self.beta_2,
            }
        )
        return config


Lion.__doc__ = Lion.__doc__.replace(
    "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args
)
@keras_export(
    [
        "keras.optimizers.LossScaleOptimizer",
        "keras.mixed_precision.LossScaleOptimizer",
    ]
)
class LossScaleOptimizer(optimizer.Optimizer):
    """An optimizer that dynamically scales the loss to prevent underflow.

    Loss scaling is a technique to prevent numeric underflow in intermediate
    gradients when float16 is used. To prevent underflow, the loss is multiplied
    (or "scaled") by a certain factor called the "loss scale", which causes
    intermediate gradients to be scaled by the loss scale as well. The final
    gradients are divided (or "unscaled") by the loss scale to bring them back
    to their original value.

    `LossScaleOptimizer` wraps another optimizer and applies dynamic loss
    scaling to it. This loss scale is dynamically updated over time as follows:
    - On any train step, if a nonfinite gradient is encountered, the loss scale
      is halved, and the train step is skipped.
    - If `dynamic_growth_steps` have occurred since the last time the loss scale
      was updated, and no nonfinite gradients have occurred, the loss scale
      is doubled.

    Args:
        inner_optimizer: The `keras.optimizers.Optimizer` instance to wrap.
        initial_scale: Float. The initial loss scale. This scale will be updated
            during training. It is recommended for this to be a very high
            number, because a loss scale that is too high gets lowered far more
            quickly than a loss scale that is too low gets raised.
        dynamic_growth_steps: Int. How often to update the scale upwards. After
            every `dynamic_growth_steps` steps with finite gradients, the
            loss scale is doubled.
        {{base_optimizer_keyword_args}}
    """

    def __init__(
        self,
        inner_optimizer,
        initial_scale=2.0**15,
        dynamic_growth_steps=2000,
        **kwargs,
    ):
        # `dynamic=False` was a legacy option; static scaling is now expressed
        # via `loss_scale_factor` on the wrapped optimizer instead.
        if not kwargs.pop("dynamic", True):
            raise ValueError(
                "LossScaleOptimizer no longer supports `dynamic=False`. "
                "Instead, simply set `loss_scale_factor` directly on the "
                "`inner_optimizer`."
            )
        # learning_rate=0.0: this wrapper holds no learning rate of its own;
        # the `learning_rate` property below delegates to `inner_optimizer`.
        super().__init__(learning_rate=0.0, **kwargs)
        self.inner_optimizer = inner_optimizer
        self.initial_scale = initial_scale
        self.dynamic_growth_steps = dynamic_growth_steps

    @tracking.no_automatic_dependency_tracking
    def build(self, var_list):
        """Create the scale-tracking variables and build the inner optimizer.

        Creates two scalar state variables: `step_counter` (finite steps since
        the last scale change) and `dynamic_scale` (the current loss scale,
        initialized to `initial_scale`).

        Args:
            var_list: list of model variables to build optimizer slots on.
        """
        self.step_counter = self.add_variable(
            shape=(),
            dtype="int",
            initializer=initializers.Zeros(),
            aggregation="none",
            name="step_counter",
        )
        self.dynamic_scale = self.add_variable(
            shape=(),
            dtype="float32",
            initializer=initializers.Constant(self.initial_scale),
            aggregation="none",
            name="dynamic_scale",
        )
        self.inner_optimizer.build(var_list)
        self.built = True

    @property
    def variables(self):
        # Own variables first, then the wrapped optimizer's. Ordering matters:
        # the stateless paths below concatenate updates in the same order.
        return self._variables + self.inner_optimizer.variables

    def stateless_apply(self, optimizer_variables, grads, trainable_variables):
        """Functional-style apply: returns new variable values, no mutation.

        Branches on whether all gradients are finite; nonfinite gradients
        skip the inner optimizer step and halve the scale.
        """
        if not self.built:
            raise ValueError(
                f"To call `stateless_apply`, {self.__class__.__name__} "
                "must be built (i.e. its variables must have been created). "
                "You can build it via `optimizer.build(trainable_variables)`."
            )
        finite = self.check_finite(grads)
        return ops.cond(
            finite,
            lambda: self._stateless_handle_finite_grads(
                optimizer_variables, grads, trainable_variables
            ),
            lambda: self._stateless_handle_non_finite_grads(
                optimizer_variables, trainable_variables
            ),
        )

    def _stateless_handle_finite_grads(
        self, optimizer_variables, grads, trainable_variables
    ):
        """Finite-gradient path of `stateless_apply`.

        Unscales the gradients, applies the inner optimizer statelessly, and
        either increments the step counter or (every `dynamic_growth_steps`
        finite steps) doubles the scale and resets the counter.
        """

        def upscale():
            mapping = list(zip(self.variables, optimizer_variables))
            with backend.StatelessScope(state_mapping=mapping) as scope:
                self.step_counter.assign(0)
                self.dynamic_scale.assign(self.dynamic_scale * 2.0)
            return [scope.get_current_value(v) for v in self._variables]

        def increment():
            mapping = list(zip(self.variables, optimizer_variables))
            with backend.StatelessScope(state_mapping=mapping) as scope:
                self.step_counter.assign_add(1)
            return [scope.get_current_value(v) for v in self._variables]

        mapping = list(zip(self.variables, optimizer_variables))
        with backend.StatelessScope(state_mapping=mapping):
            # Potentially upscale loss and reset counter.
            own_variables = ops.cond(
                ops.equal(self.step_counter, self.dynamic_growth_steps - 1),
                upscale,
                increment,
            )

            # Unscale gradients.
            scale = self.dynamic_scale
            unscaled_grads = [
                g if g is None else ops.divide(g, scale) for g in grads
            ]
            (
                new_trainable_variables,
                new_inner_variables,
            ) = self.inner_optimizer.stateless_apply(
                self.inner_optimizer.variables,
                unscaled_grads,
                trainable_variables,
            )

        # Concatenation order matches the `variables` property.
        new_optimizer_variables = own_variables + new_inner_variables
        return new_trainable_variables, new_optimizer_variables

    def _stateless_handle_non_finite_grads(
        self, optimizer_variables, trainable_variables
    ):
        """Nonfinite-gradient path: halve the scale, skip the train step.

        Trainable variables are returned unchanged; only the wrapper's own
        state (counter reset, scale halved) is updated.
        """
        mapping = list(zip(self.variables, optimizer_variables))
        with backend.StatelessScope(state_mapping=mapping) as scope:
            self.step_counter.assign(0)
            self.dynamic_scale.assign(self.dynamic_scale / 2.0)
        new_optimizer_variables = []
        for v in self.variables:
            new_optimizer_variables.append(scope.get_current_value(v))
        return trainable_variables, new_optimizer_variables

    def apply(self, grads, trainable_variables=None):
        """Stateful apply; dispatches to the TF-specific path when needed."""
        # Optionally build optimizer.
        if not self.built:
            with backend.name_scope(self.name, caller=self):
                self.build(trainable_variables)
            self.built = True

        if backend.backend() == "tensorflow":
            self._tf_apply(grads, trainable_variables)
        else:
            self._common_apply(grads, trainable_variables)

    def _stateful_handle_finite_grads(self, grads, trainable_variables):
        """Finite-gradient path of stateful `apply` (mutates state in place)."""
        scale = self.dynamic_scale
        # Unscale gradients.
        unscaled_grads = [
            g if g is None else ops.divide(g, scale) for g in grads
        ]
        self.inner_optimizer.apply(
            unscaled_grads, trainable_variables=trainable_variables
        )

        def upscale():
            self.step_counter.assign(0)
            self.dynamic_scale.assign(self.dynamic_scale * 2.0)

        def increment():
            self.step_counter.assign_add(1)

        # Potentially upscale loss and reset counter.
        ops.cond(
            ops.equal(self.step_counter, self.dynamic_growth_steps - 1),
            upscale,
            increment,
        )

    def _stateful_handle_non_finite_grads(self):
        # If any inf or nan in grads, downscale loss and reset counter.
        self.step_counter.assign(0)
        self.dynamic_scale.assign(self.dynamic_scale / 2.0)

    def _common_apply(self, grads, trainable_variables=None):
        # Backend-agnostic stateful apply: branch on gradient finiteness.
        finite = self.check_finite(grads)
        ops.cond(
            finite,
            lambda: self._stateful_handle_finite_grads(
                grads, trainable_variables
            ),
            self._stateful_handle_non_finite_grads,
        )

    def _tf_apply(self, grads, trainable_variables=None):
        """Tensorflow specific logic for apply, which handles distribution."""
        from keras.src.utils.module_utils import tensorflow as tf

        if tf.distribute.in_cross_replica_context():
            raise ValueError("apply() must be called in a replica context.")

        if tf.__internal__.distribute.strategy_supports_no_merge_call():
            self._common_apply(grads, trainable_variables=trainable_variables)
        else:

            def _handle_cross_replica(distribution, grads, trainable_variables):
                finite_per_replica = (
                    distribution.extended.call_for_each_replica(
                        self.check_finite, args=(grads,)
                    )
                )
                # Each replica computed the same `finite` value, since
                # `grads` is all-reduced across replicas. Arbitrarily take
                # `finite` from the first replica.
                finite = distribution.experimental_local_results(
                    finite_per_replica
                )[0]

                def apply_fn():
                    distribution.extended.call_for_each_replica(
                        self._stateful_handle_finite_grads,
                        args=(grads, trainable_variables),
                    )

                # Note: We must call this cond() in a cross-replica context.
                # DistributionStrategy does not support having a cond in a
                # replica context with a branch that calls `merge_call`, and
                # self._optimizer.apply_gradients calls `merge_call`.
                ops.cond(
                    finite, apply_fn, self._stateful_handle_non_finite_grads
                )

            tf.distribute.get_replica_context().merge_call(
                _handle_cross_replica, args=(grads, trainable_variables)
            )

    def check_finite(self, grads):
        """Return a scalar boolean tensor: True iff all gradients are finite.

        `None` gradients (variables with no gradient) are ignored.
        """
        tensor_grads = [g for g in grads if g is not None]
        finite_grads = [ops.all(ops.isfinite(g)) for g in tensor_grads]
        return ops.all(ops.convert_to_tensor(finite_grads))

    @property
    def learning_rate(self):
        # Delegated: the wrapper itself has no meaningful learning rate.
        return self.inner_optimizer.learning_rate

    @learning_rate.setter
    def learning_rate(self, learning_rate):
        self.inner_optimizer.learning_rate = learning_rate

    def scale_loss(self, loss):
        """Multiply `loss` by the current (or initial, if unbuilt) scale."""
        scale = self.dynamic_scale if self.built else self.initial_scale
        return loss * scale

    def finalize_variable_values(self, var_list):
        self.inner_optimizer.finalize_variable_values(var_list)

    def get_config(self):
        """Serialize config; the inner optimizer is serialized recursively.

        `learning_rate` is removed because it is owned by the inner optimizer
        (see the `learning_rate` property above).
        """
        config = super().get_config()
        inner_optimizer_config = serialization_lib.serialize_keras_object(
            self.inner_optimizer
        )
        config.update(
            {
                "inner_optimizer": inner_optimizer_config,
                "initial_scale": self.initial_scale,
                "dynamic_growth_steps": self.dynamic_growth_steps,
            }
        )
        del config["learning_rate"]
        return config

    @classmethod
    def from_config(cls, config, custom_objects=None):
        """Rebuild from `get_config()` output, deserializing the inner optimizer."""
        inner_optimizer = serialization_lib.deserialize_keras_object(
            config.pop("inner_optimizer"),
            custom_objects=custom_objects,
        )
        return cls(inner_optimizer, **config)


LossScaleOptimizer.__doc__ = LossScaleOptimizer.__doc__.replace(
    "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args
)
from keras.src import backend
from keras.src import ops
from keras.src.api_export import keras_export
from keras.src.optimizers import optimizer


@keras_export(["keras.optimizers.Nadam"])
class Nadam(optimizer.Optimizer):
    """Optimizer that implements the Nadam algorithm.

    Much like Adam is essentially RMSprop with momentum, Nadam is Adam with
    Nesterov momentum.

    Args:
        learning_rate: A float, a
            `keras.optimizers.schedules.LearningRateSchedule` instance, or
            a callable that takes no arguments and returns the actual value to
            use. The learning rate. Defaults to `0.001`.
        beta_1: A float value or a constant float tensor, or a callable
            that takes no arguments and returns the actual value to use. The
            exponential decay rate for the 1st moment estimates.
            Defaults to `0.9`.
        beta_2: A float value or a constant float tensor, or a callable
            that takes no arguments and returns the actual value to use. The
            exponential decay rate for the 2nd moment estimates. Defaults to
            `0.999`.
        epsilon: A small constant for numerical stability. This epsilon is
            "epsilon hat" in the Kingma and Ba paper (in the formula just before
            Section 2.1), not the epsilon in Algorithm 1 of the paper.
            Defaults to `1e-7`.
        {{base_optimizer_keyword_args}}

    Reference:

    - [Dozat, 2015](http://cs229.stanford.edu/proj2015/054_report.pdf).

    """

    def __init__(
        self,
        learning_rate=0.001,
        beta_1=0.9,
        beta_2=0.999,
        epsilon=1e-7,
        weight_decay=None,
        clipnorm=None,
        clipvalue=None,
        global_clipnorm=None,
        use_ema=False,
        ema_momentum=0.99,
        ema_overwrite_frequency=None,
        loss_scale_factor=None,
        gradient_accumulation_steps=None,
        name="nadam",
        **kwargs,
    ):
        super().__init__(
            learning_rate=learning_rate,
            name=name,
            weight_decay=weight_decay,
            clipnorm=clipnorm,
            clipvalue=clipvalue,
            global_clipnorm=global_clipnorm,
            use_ema=use_ema,
            ema_momentum=ema_momentum,
            ema_overwrite_frequency=ema_overwrite_frequency,
            loss_scale_factor=loss_scale_factor,
            gradient_accumulation_steps=gradient_accumulation_steps,
            **kwargs,
        )
        self.beta_1 = beta_1
        self.beta_2 = beta_2
        self.epsilon = epsilon

    def build(self, var_list):
        """Initialize optimizer variables.

        Nadam optimizer has 2 types of variables: momentums and velocities.
        It also keeps a scalar `_u_product`, the running product of the
        momentum-cache terms u_t used by the Nesterov correction (see
        `update_step`); it starts at 1.0 and is advanced once per step in
        `_backend_update_step`.

        Args:
            var_list: list of model variables to build Nadam variables on.
        """
        if self.built:
            return
        # _u_product must match the variables' dtype; fall back to the
        # backend default when there are no variables.
        if var_list:
            dtype = var_list[0].dtype
        else:
            dtype = backend.floatx()
        super().build(var_list)
        self._momentums = []
        self._velocities = []
        self._u_product = backend.Variable(1.0, dtype=dtype)

        for var in var_list:
            self._momentums.append(
                self.add_variable_from_reference(
                    reference_variable=var, name="momentum"
                )
            )
            self._velocities.append(
                self.add_variable_from_reference(
                    reference_variable=var, name="velocity"
                )
            )

    def _backend_update_step(self, grads, trainable_variables, learning_rate):
        # Advance the running product once per optimizer step (not per
        # variable): u_product *= u_t where
        # u_t = beta_1 * (1 - 0.5 * 0.96^(t+1)). This must happen before the
        # per-variable `update_step` calls, which read `_u_product`.
        dtype = self._u_product.dtype
        self.assign(
            self._u_product,
            self._u_product
            * self.beta_1
            * (
                1.0
                - 0.5 * ops.power(0.96, ops.cast(self.iterations + 1, dtype))
            ),
        )
        super()._backend_update_step(grads, trainable_variables, learning_rate)

    def update_step(self, gradient, variable, learning_rate):
        """Update step given gradient and the associated model variable."""
        var_dtype = variable.dtype
        lr = ops.cast(learning_rate, var_dtype)
        gradient = ops.cast(gradient, var_dtype)

        local_step = ops.cast(self.iterations + 1, var_dtype)
        next_step = ops.cast(self.iterations + 2, var_dtype)
        decay = ops.cast(0.96, var_dtype)
        beta_1 = ops.cast(self.beta_1, var_dtype)
        beta_2 = ops.cast(self.beta_2, var_dtype)
        # Momentum-cache terms for the current and the next step; u_t_1 is
        # needed because Nadam applies the *next* step's momentum to m_hat.
        u_t = beta_1 * (1.0 - 0.5 * (ops.power(decay, local_step)))
        u_t_1 = beta_1 * (1.0 - 0.5 * (ops.power(decay, next_step)))
        # `_u_product` was already advanced to include u_t by
        # `_backend_update_step` above.
        u_product_t = ops.cast(self._u_product, var_dtype)

        u_product_t_1 = u_product_t * u_t_1
        beta_2_power = ops.power(beta_2, local_step)

        m = self._momentums[self._get_variable_index(variable)]
        v = self._velocities[self._get_variable_index(variable)]

        # m <- m + (1 - beta_1) * (g - m)   (EMA of gradients)
        self.assign_add(
            m, ops.multiply(ops.subtract(gradient, m), (1 - beta_1))
        )
        # v <- v + (1 - beta_2) * (g^2 - v) (EMA of squared gradients)
        self.assign_add(
            v, ops.multiply(ops.subtract(ops.square(gradient), v), (1 - beta_2))
        )
        # Nesterov-corrected, bias-corrected first moment.
        m_hat = ops.add(
            ops.divide(ops.multiply(u_t_1, m), 1 - u_product_t_1),
            ops.divide(ops.multiply(1 - u_t, gradient), 1 - u_product_t),
        )
        # Bias-corrected second moment.
        v_hat = ops.divide(v, (1 - beta_2_power))

        self.assign_sub(
            variable,
            ops.divide(
                ops.multiply(m_hat, lr), ops.add(ops.sqrt(v_hat), self.epsilon)
            ),
        )

    def get_config(self):
        """Return the optimizer configuration (adds beta_1/beta_2/epsilon)."""
        config = super().get_config()

        config.update(
            {
                "beta_1": self.beta_1,
                "beta_2": self.beta_2,
                "epsilon": self.epsilon,
            }
        )
        return config


Nadam.__doc__ = Nadam.__doc__.replace(
    "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args
)


# ---- keras/src/optimizers/optimizer.py (separate module in the original
# tree; reproduced here because it falls inside this span of the diff) ----

from keras.src import backend
from keras.src.api_export import keras_export
from keras.src.optimizers import base_optimizer

# Select a backend-specific optimizer mixin at import time; the generic
# BaseOptimizer is used when no backend-specific implementation exists.
if backend.backend() == "tensorflow":
    from keras.src.backend.tensorflow.optimizer import (
        TFOptimizer as BackendOptimizer,
    )
elif backend.backend() == "torch":
    from keras.src.backend.torch.optimizers import (
        TorchOptimizer as BackendOptimizer,
    )
elif backend.backend() == "jax":
    from keras.src.backend.jax.optimizer import JaxOptimizer as BackendOptimizer
else:

    class BackendOptimizer(base_optimizer.BaseOptimizer):
        pass


@keras_export(["keras.Optimizer", "keras.optimizers.Optimizer"])
class Optimizer(BackendOptimizer, base_optimizer.BaseOptimizer):
    # MRO: backend-specific overrides take precedence over BaseOptimizer.
    pass


Optimizer.__doc__ = base_optimizer.BaseOptimizer.__doc__
base_optimizer_keyword_args = base_optimizer.base_optimizer_keyword_args
from keras.src import ops
from keras.src.api_export import keras_export
from keras.src.optimizers import optimizer


@keras_export(["keras.optimizers.RMSprop"])
class RMSprop(optimizer.Optimizer):
    """Optimizer that implements the RMSprop algorithm.

    The gist of RMSprop is to:

    - Maintain a moving (discounted) average of the square of gradients
    - Divide the gradient by the root of this average

    This implementation of RMSprop uses plain momentum, not Nesterov momentum.

    The centered version additionally maintains a moving average of the
    gradients, and uses that average to estimate the variance.

    Args:
        learning_rate: A float, a
            `keras.optimizers.schedules.LearningRateSchedule` instance, or
            a callable that takes no arguments and returns the actual value to
            use. The learning rate. Defaults to `0.001`.
        rho: float, defaults to 0.9. Discounting factor for the old gradients.
        momentum: float, defaults to 0.0. If not 0.0., the optimizer tracks the
            momentum value, with a decay rate equals to `1 - momentum`.
        epsilon: A small constant for numerical stability. This epsilon is
            "epsilon hat" in the Kingma and Ba paper (in the formula just before
            Section 2.1), not the epsilon in Algorithm 1 of the paper. Defaults
            to 1e-7.
        centered: Boolean. If `True`, gradients are normalized by the estimated
            variance of the gradient; if False, by the uncentered second moment.
            Setting this to `True` may help with training, but is slightly more
            expensive in terms of computation and memory. Defaults to `False`.
        {{base_optimizer_keyword_args}}

    Example:

    >>> opt = keras.optimizers.RMSprop(learning_rate=0.1)
    >>> var1 = keras.backend.Variable(10.0)
    >>> loss = lambda: (var1 ** 2) / 2.0    # d(loss) / d(var1) = var1
    >>> opt.minimize(loss, [var1])
    >>> var1
    9.683772

    Reference:

    - [Hinton, 2012](
        http://www.cs.toronto.edu/~tijmen/csc321/slides/lecture_slides_lec6.pdf)
    """

    def __init__(
        self,
        learning_rate=0.001,
        rho=0.9,
        momentum=0.0,
        epsilon=1e-7,
        centered=False,
        weight_decay=None,
        clipnorm=None,
        clipvalue=None,
        global_clipnorm=None,
        use_ema=False,
        ema_momentum=0.99,
        ema_overwrite_frequency=None,
        loss_scale_factor=None,
        gradient_accumulation_steps=None,
        name="rmsprop",
        **kwargs,
    ):
        super().__init__(
            learning_rate=learning_rate,
            weight_decay=weight_decay,
            clipnorm=clipnorm,
            clipvalue=clipvalue,
            global_clipnorm=global_clipnorm,
            use_ema=use_ema,
            ema_momentum=ema_momentum,
            ema_overwrite_frequency=ema_overwrite_frequency,
            loss_scale_factor=loss_scale_factor,
            gradient_accumulation_steps=gradient_accumulation_steps,
            name=name,
            **kwargs,
        )
        self.rho = rho
        self.momentum = momentum
        self.epsilon = epsilon
        self.centered = centered

    def build(self, var_list):
        """Initialize optimizer variables.

        Always creates `velocities` (EMA of squared gradients); `momentums`
        only when `momentum > 0`, and `average_gradients` (EMA of gradients)
        only when `centered=True`.

        Args:
            var_list: list of model variables to build RMSprop variables on.
        """
        if self.built:
            return

        super().build(var_list)

        self._velocities = []
        for var in var_list:
            self._velocities.append(
                self.add_variable_from_reference(var, "velocity")
            )

        self._momentums = []
        if self.momentum > 0:
            for var in var_list:
                self._momentums.append(
                    self.add_variable_from_reference(var, "momentum")
                )

        self._average_gradients = []
        if self.centered:
            for var in var_list:
                self._average_gradients.append(
                    self.add_variable_from_reference(var, "average_gradient")
                )

    def update_step(self, gradient, variable, learning_rate):
        """Update step given gradient and the associated model variable."""
        lr = ops.cast(learning_rate, variable.dtype)
        gradient = ops.cast(gradient, variable.dtype)

        velocity = self._velocities[self._get_variable_index(variable)]
        momentum = None
        if self.momentum > 0:
            momentum = self._momentums[self._get_variable_index(variable)]
        average_grad = None
        if self.centered:
            average_grad = self._average_gradients[
                self._get_variable_index(variable)
            ]

        rho = self.rho

        # velocity <- rho * velocity + (1 - rho) * g^2
        self.assign(
            velocity,
            ops.add(
                ops.multiply(rho, velocity),
                ops.multiply(1 - rho, ops.square(gradient)),
            ),
        )
        if self.centered:
            # average_grad <- rho * average_grad + (1 - rho) * g
            self.assign(
                average_grad,
                ops.add(
                    ops.multiply(rho, average_grad),
                    ops.multiply(1 - rho, gradient),
                ),
            )
            # Centered variant: normalize by the estimated variance
            # E[g^2] - (E[g])^2 rather than the raw second moment.
            denominator = velocity - ops.square(average_grad) + self.epsilon
        else:
            denominator = ops.add(velocity, self.epsilon)
        increment = ops.divide(
            ops.multiply(lr, gradient), ops.sqrt(denominator)
        )
        if self.momentum > 0:
            # momentum <- momentum_coefficient * momentum + increment,
            # then apply the accumulated momentum to the variable.
            self.assign(
                momentum,
                ops.add(ops.multiply(self.momentum, momentum), increment),
            )
            self.assign_sub(variable, momentum)
        else:
            self.assign_sub(variable, increment)

    def get_config(self):
        """Return the optimizer configuration (adds RMSprop hyperparameters)."""
        config = super().get_config()

        config.update(
            {
                "rho": self.rho,
                "momentum": self.momentum,
                "epsilon": self.epsilon,
                "centered": self.centered,
            }
        )
        return config


RMSprop.__doc__ = RMSprop.__doc__.replace(
    "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args
)
keras.src.optimizers.schedules.learning_rate_schedule import ( + ExponentialDecay, +) +from keras.src.optimizers.schedules.learning_rate_schedule import ( + InverseTimeDecay, +) +from keras.src.optimizers.schedules.learning_rate_schedule import ( + PiecewiseConstantDecay, +) +from keras.src.optimizers.schedules.learning_rate_schedule import ( + PolynomialDecay, +) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/__pycache__/__init__.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..12e85e9d481781e776155a2bb99657b3bd8a92d0 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/__pycache__/__init__.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/__pycache__/learning_rate_schedule.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/__pycache__/learning_rate_schedule.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a54c2f679f44e0edee5da819177365af188428cb Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/__pycache__/learning_rate_schedule.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/learning_rate_schedule.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/learning_rate_schedule.py new file mode 100644 index 0000000000000000000000000000000000000000..74c13aafbe5303c6328a449e0658ec10cb5d146e --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/optimizers/schedules/learning_rate_schedule.py @@ 
"""Various learning rate schedule functions."""

import math

from keras.src import ops
from keras.src.api_export import keras_export
from keras.src.saving import serialization_lib


@keras_export("keras.optimizers.schedules.LearningRateSchedule")
class LearningRateSchedule:
    """Base class for learning rate schedules.

    A learning rate schedule modulates how the learning rate of an optimizer
    evolves over the course of training. Several built-in schedules are
    available, e.g. `keras.optimizers.schedules.ExponentialDecay` or
    `keras.optimizers.schedules.PiecewiseConstantDecay`:

    ```python
    lr_schedule = keras.optimizers.schedules.ExponentialDecay(
        initial_learning_rate=1e-2,
        decay_steps=10000,
        decay_rate=0.9)
    optimizer = keras.optimizers.SGD(learning_rate=lr_schedule)
    ```

    Any `LearningRateSchedule` instance can be passed directly as the
    `learning_rate` argument of an optimizer.

    To write a custom schedule, subclass this class and implement `__call__`,
    which receives the current optimizer step (a scalar integer tensor) and
    returns the learning rate to use. Optionally implement `get_config` /
    `from_config` to make the schedule serializable like any Keras object.

    Example:

    ```python
    class MyLRSchedule(keras.optimizers.schedules.LearningRateSchedule):

        def __init__(self, initial_learning_rate):
            self.initial_learning_rate = initial_learning_rate

        def __call__(self, step):
            return self.initial_learning_rate / (step + 1)

    optimizer = keras.optimizers.SGD(learning_rate=MyLRSchedule(0.1))
    ```
    """

    def __call__(self, step):
        # Abstract: subclasses must compute the learning rate for `step`.
        cls_name = self.__class__.__name__
        raise NotImplementedError(
            f"Learning rate schedule '{cls_name}' "
            "must override `__call__(self, step)`."
        )

    def get_config(self):
        # Abstract: required only when the schedule must be serializable.
        cls_name = self.__class__.__name__
        raise NotImplementedError(
            f"Learning rate schedule '{cls_name}' "
            "must override `get_config()` in order to be serializable."
        )

    @classmethod
    def from_config(cls, config):
        """Instantiates a `LearningRateSchedule` from its config.

        Args:
            config: Output of `get_config()`.

        Returns:
            A `LearningRateSchedule` instance.
        """
        return cls(**config)


@keras_export("keras.optimizers.schedules.ExponentialDecay")
class ExponentialDecay(LearningRateSchedule):
    """A `LearningRateSchedule` that uses an exponential decay schedule.

    Lowering the learning rate as training progresses is often useful. This
    schedule applies an exponential decay to the initial learning rate as a
    function of the optimizer step. It is a 1-arg callable computing:

    ```python
    def decayed_learning_rate(step):
        return initial_learning_rate * decay_rate ^ (step / decay_steps)
    ```

    When `staircase=True`, `step / decay_steps` is an integer division, so
    the decayed learning rate follows a staircase function.

    The schedule can be passed directly to a `keras.optimizers.Optimizer`
    as its learning rate.

    Example: decay every 100000 steps with a base of 0.96:

    ```python
    initial_learning_rate = 0.1
    lr_schedule = keras.optimizers.schedules.ExponentialDecay(
        initial_learning_rate,
        decay_steps=100000,
        decay_rate=0.96,
        staircase=True)

    model.compile(optimizer=keras.optimizers.SGD(learning_rate=lr_schedule),
                  loss='sparse_categorical_crossentropy',
                  metrics=['accuracy'])

    model.fit(data, labels, epochs=5)
    ```

    The schedule is serializable and deserializable via
    `keras.optimizers.schedules.serialize` and
    `keras.optimizers.schedules.deserialize`.

    Args:
        initial_learning_rate: A Python float. The initial learning rate.
        decay_steps: A Python integer. Must be positive. See the decay
            computation above.
        decay_rate: A Python float. The decay rate.
        staircase: Boolean. If `True` decay the learning rate at discrete
            intervals.
        name: String. Optional name of the operation. Defaults to
            `"ExponentialDecay`".

    Returns:
        A 1-arg callable learning rate schedule that takes the current
        optimizer step and outputs the decayed learning rate, a scalar
        tensor of the same type as `initial_learning_rate`.
    """

    def __init__(
        self,
        initial_learning_rate,
        decay_steps,
        decay_rate,
        staircase=False,
        name="ExponentialDecay",
    ):
        super().__init__()
        self.initial_learning_rate = initial_learning_rate
        self.decay_steps = decay_steps
        self.decay_rate = decay_rate
        self.staircase = staircase
        self.name = name

        if self.decay_steps <= 0:
            raise ValueError(
                "Argument `decay_steps` must be > 0. "
                f"Received: decay_steps={self.decay_steps}"
            )

    def __call__(self, step):
        with ops.name_scope(self.name):
            init_lr = ops.convert_to_tensor(self.initial_learning_rate)
            dtype = init_lr.dtype
            steps = ops.cast(self.decay_steps, dtype)
            rate = ops.cast(self.decay_rate, dtype)

            # Fraction of the decay period elapsed; floored to an integer
            # count of periods in staircase mode.
            exponent = ops.cast(step, dtype) / steps
            if self.staircase:
                exponent = ops.floor(exponent)
            return ops.multiply(init_lr, ops.power(rate, exponent))

    def get_config(self):
        # Serialize exactly the constructor arguments.
        return {
            key: getattr(self, key)
            for key in (
                "initial_learning_rate",
                "decay_steps",
                "decay_rate",
                "staircase",
                "name",
            )
        }
@keras_export("keras.optimizers.schedules.PiecewiseConstantDecay")
class PiecewiseConstantDecay(LearningRateSchedule):
    """A `LearningRateSchedule` that uses a piecewise constant decay schedule.

    The function returns a 1-arg callable to compute the piecewise constant
    when passed the current optimizer step.

    Example: use a learning rate that's 1.0 for the first 100001 steps, 0.5
    for the next 10000 steps, and 0.1 for any additional steps:

    ```python
    boundaries = [100000, 110000]
    values = [1.0, 0.5, 0.1]
    learning_rate_fn = keras.optimizers.schedules.PiecewiseConstantDecay(
        boundaries, values)
    learning_rate = learning_rate_fn(step)
    ```

    You can pass this schedule directly into a `keras.optimizers.Optimizer`
    as the learning rate. The schedule is serializable and deserializable
    via `keras.optimizers.schedules.serialize` and
    `keras.optimizers.schedules.deserialize`.

    Args:
        boundaries: A list of Python numbers with strictly increasing
            entries, and with all elements having the same type as the
            optimizer step.
        values: A list of Python numbers that specifies the values for the
            intervals defined by `boundaries`. It should have one more
            element than `boundaries`, and all elements should have the
            same type.
        name: A string. Optional name of the operation. Defaults to
            `"PiecewiseConstant"`.

    Returns:
        A 1-arg callable learning rate schedule that takes the current
        optimizer step and outputs `values[0]` when `step <= boundaries[0]`,
        `values[1]` when `step > boundaries[0]` and `step <= boundaries[1]`,
        ..., and `values[-1]` when `step > boundaries[-1]`.

    Raises:
        ValueError: if the number of elements in the `boundaries` and
            `values` lists do not match.
    """

    def __init__(self, boundaries, values, name="PiecewiseConstant"):
        super().__init__()

        if len(boundaries) != len(values) - 1:
            raise ValueError(
                "The length of boundaries should be 1 less than the length of "
                f"values. Received: boundaries={boundaries} of length "
                f"{len(boundaries)}, and values={values} "
                f"of length {len(values)}."
            )

        self.boundaries = boundaries
        self.values = values
        self.name = name

    def __call__(self, step):
        with ops.name_scope(self.name):
            step = ops.convert_to_tensor(step)
            # Boundaries must share the step's dtype for the comparisons
            # below; casting to an identical dtype is a no-op, so the cast
            # is applied unconditionally.
            boundaries = [
                ops.cast(ops.convert_to_tensor(b), step.dtype)
                for b in self.boundaries
            ]
            values = [ops.convert_to_tensor(v) for v in self.values]

            result_dtype = values[0].dtype
            result_value = ops.array(0, dtype=result_dtype)

            # For each interval, cast the membership test to a 0/1 number and
            # multiply it by the interval's value; summing the products over
            # all intervals yields the piecewise constant function.
            result_value += (
                ops.cast(step <= boundaries[0], result_dtype) * values[0]
            )
            result_value += (
                ops.cast(step > boundaries[-1], result_dtype) * values[-1]
            )

            for low, high, value in zip(
                boundaries[:-1], boundaries[1:], values[1:-1]
            ):
                step_in_range = ops.cast(
                    (step > low) & (step <= high), result_dtype
                )
                result_value += step_in_range * value

            return result_value

    def get_config(self):
        return {
            "boundaries": self.boundaries,
            "values": self.values,
            "name": self.name,
        }
@keras_export("keras.optimizers.schedules.PolynomialDecay")
class PolynomialDecay(LearningRateSchedule):
    """A `LearningRateSchedule` that uses a polynomial decay schedule.

    This schedule applies a polynomial decay function to an optimizer step,
    taking the learning rate from `initial_learning_rate` down to
    `end_learning_rate` over `decay_steps` steps. The schedule is a 1-arg
    callable computing:

    ```python
    def decayed_learning_rate(step):
        step = min(step, decay_steps)
        return ((initial_learning_rate - end_learning_rate) *
                (1 - step / decay_steps) ** power
               ) + end_learning_rate
    ```

    If `cycle` is `True`, `decay_steps` is replaced by its first multiple
    that is bigger than `step`, so the decay restarts instead of flattening
    out at `end_learning_rate`.

    You can pass this schedule directly into a `keras.optimizers.Optimizer`
    as the learning rate. The schedule is serializable and deserializable
    via `keras.optimizers.schedules.serialize` and
    `keras.optimizers.schedules.deserialize`.

    Args:
        initial_learning_rate: A Python float. The initial learning rate.
        decay_steps: A Python integer. Must be positive. See the decay
            computation above.
        end_learning_rate: A Python float. The minimal end learning rate.
        power: A Python float. The power of the polynomial. Defaults to
            `1.0`.
        cycle: A boolean, whether it should cycle beyond decay_steps.
        name: String. Optional name of the operation. Defaults to
            `"PolynomialDecay"`.

    Returns:
        A 1-arg callable learning rate schedule that takes the current
        optimizer step and outputs the decayed learning rate, a scalar
        tensor of the same type as `initial_learning_rate`.
    """

    def __init__(
        self,
        initial_learning_rate,
        decay_steps,
        end_learning_rate=0.0001,
        power=1.0,
        cycle=False,
        name="PolynomialDecay",
    ):
        super().__init__()

        self.initial_learning_rate = initial_learning_rate
        self.decay_steps = decay_steps
        self.end_learning_rate = end_learning_rate
        self.power = power
        self.cycle = cycle
        self.name = name

        if self.decay_steps <= 0:
            raise ValueError(
                "Argument `decay_steps` must be > 0. "
                f"Received: decay_steps={self.decay_steps}"
            )

    def __call__(self, step):
        with ops.name_scope(self.name):
            start_lr = ops.convert_to_tensor(self.initial_learning_rate)
            dtype = start_lr.dtype
            end_lr = ops.cast(self.end_learning_rate, dtype)
            power = ops.cast(self.power, dtype)

            current_step = ops.cast(step, dtype)
            horizon = ops.cast(self.decay_steps, dtype)

            if self.cycle:
                # Stretch the horizon to the first multiple of `decay_steps`
                # beyond the current step; step 0 counts as one full period.
                multiplier = ops.where(
                    ops.equal(current_step, 0),
                    1.0,
                    ops.ceil(current_step / self.decay_steps),
                )
                horizon = ops.multiply(horizon, multiplier)
            else:
                # Clamp so the rate settles at `end_learning_rate` once the
                # horizon is passed.
                current_step = ops.minimum(current_step, horizon)

            fraction = ops.divide(current_step, horizon)
            decaying_part = ops.multiply(
                start_lr - end_lr, ops.power(1 - fraction, power)
            )
            return ops.add(decaying_part, end_lr)

    def get_config(self):
        return {
            "initial_learning_rate": self.initial_learning_rate,
            "decay_steps": self.decay_steps,
            "end_learning_rate": self.end_learning_rate,
            "power": self.power,
            "cycle": self.cycle,
            "name": self.name,
        }
@keras_export("keras.optimizers.schedules.InverseTimeDecay")
class InverseTimeDecay(LearningRateSchedule):
    """A `LearningRateSchedule` that uses an inverse time decay schedule.

    When training a model, it is often useful to lower the learning rate as
    the training progresses. This schedule applies the inverse decay
    function to an optimizer step, given a provided initial learning rate.

    The schedule is a 1-arg callable that produces a decayed learning rate
    when passed the current optimizer step. It is computed as:

    ```python
    def decayed_learning_rate(step):
        return initial_learning_rate / (1 + decay_rate * step / decay_step)
    ```

    or, if `staircase` is `True`, as:

    ```python
    def decayed_learning_rate(step):
        return initial_learning_rate /
               (1 + decay_rate * floor(step / decay_step))
    ```

    You can pass this schedule directly into a `keras.optimizers.Optimizer`
    as the learning rate.

    Example: Fit a Keras model when decaying 1/t with a rate of 0.5:

    ```python
    learning_rate_fn = keras.optimizers.schedules.InverseTimeDecay(
        0.1, decay_steps=1.0, decay_rate=0.5)
    model.compile(optimizer=keras.optimizers.SGD(
                      learning_rate=learning_rate_fn),
                  loss='sparse_categorical_crossentropy')
    ```

    Args:
        initial_learning_rate: A Python float. The initial learning rate.
        decay_steps: How often to apply decay.
        decay_rate: A Python number. The decay rate.
        staircase: Whether to apply decay in a discrete staircase, as
            opposed to continuous, fashion.
        name: String. Optional name of the operation. Defaults to
            `"InverseTimeDecay"`.

    Returns:
        A 1-arg callable learning rate schedule that takes the current
        optimizer step and outputs the decayed learning rate, a scalar
        tensor of the same type as `initial_learning_rate`.
    """

    def __init__(
        self,
        initial_learning_rate,
        decay_steps,
        decay_rate,
        staircase=False,
        name="InverseTimeDecay",
    ):
        super().__init__()

        self.initial_learning_rate = initial_learning_rate
        self.decay_steps = decay_steps
        self.decay_rate = decay_rate
        self.staircase = staircase
        self.name = name

        if self.decay_steps <= 0:
            raise ValueError(
                "Argument `decay_steps` must be > 0. "
                f"Received: decay_steps={self.decay_steps}"
            )

    def __call__(self, step):
        with ops.name_scope(self.name):
            initial_learning_rate = ops.convert_to_tensor(
                self.initial_learning_rate
            )
            dtype = initial_learning_rate.dtype
            decay_steps = ops.cast(self.decay_steps, dtype)
            decay_rate = ops.cast(self.decay_rate, dtype)

            global_step_recomp = ops.cast(step, dtype)
            p = global_step_recomp / decay_steps
            if self.staircase:
                # Discrete decay: hold the rate constant within each
                # `decay_steps` interval.
                p = ops.floor(p)
            const = ops.cast(ops.array(1), dtype)
            denom = ops.add(const, ops.multiply(decay_rate, p))
            return ops.divide(initial_learning_rate, denom)

    def get_config(self):
        return {
            "initial_learning_rate": self.initial_learning_rate,
            "decay_steps": self.decay_steps,
            "decay_rate": self.decay_rate,
            "staircase": self.staircase,
            "name": self.name,
        }
@keras_export("keras.optimizers.schedules.CosineDecay")
class CosineDecay(LearningRateSchedule):
    """A `LearningRateSchedule` that uses a cosine decay with optional warmup.

    See [Loshchilov & Hutter, ICLR2016](https://arxiv.org/abs/1608.03983),
    SGDR: Stochastic Gradient Descent with Warm Restarts. For the idea of a
    linear warmup of the learning rate, see
    [Goyal et al.](https://arxiv.org/pdf/1706.02677.pdf).

    If `warmup_target` is not `None`, the schedule linearly increases the
    learning rate from `initial_learning_rate` to `warmup_target` over
    `warmup_steps` steps, then applies a cosine decay from `warmup_target`
    down to `alpha * warmup_target` over `decay_steps` steps. If
    `warmup_target` is `None`, the warmup phase is skipped and the cosine
    decay starts from `initial_learning_rate`.

    The warmup is computed as:

    ```python
    def warmup_learning_rate(step):
        completed_fraction = step / warmup_steps
        total_delta = warmup_target - initial_learning_rate
        return completed_fraction * total_delta + initial_learning_rate
    ```

    And the decay as:

    ```python
    def decayed_learning_rate(step):
        step = min(step, decay_steps)
        cosine_decay = 0.5 * (1 + cos(pi * step / decay_steps))
        decayed = (1 - alpha) * cosine_decay + alpha
        return initial_decay_lr * decayed
    ```

    You can pass this schedule directly into a `keras.optimizers.Optimizer`
    as the learning rate. The schedule is serializable and deserializable
    via `keras.optimizers.schedules.serialize` and
    `keras.optimizers.schedules.deserialize`.

    Args:
        initial_learning_rate: A Python float. The initial learning rate.
        decay_steps: A Python int. Number of steps to decay over.
        alpha: A Python float. Minimum learning rate value for decay as a
            fraction of `initial_learning_rate`.
        name: String. Optional name of the operation. Defaults to
            `"CosineDecay"`.
        warmup_target: A Python float. The target learning rate for the
            warmup phase. Will cast to the `initial_learning_rate` datatype.
            Setting to `None` will skip warmup and begin the decay phase
            from `initial_learning_rate`.
        warmup_steps: A Python int. Number of steps to warmup over.

    Returns:
        A 1-arg callable learning rate schedule that takes the current
        optimizer step and outputs the decayed learning rate, a scalar
        tensor of the same type as `initial_learning_rate`.
    """

    def __init__(
        self,
        initial_learning_rate,
        decay_steps,
        alpha=0.0,
        name="CosineDecay",
        warmup_target=None,
        warmup_steps=0,
    ):
        super().__init__()

        self.initial_learning_rate = initial_learning_rate
        self.decay_steps = decay_steps
        self.alpha = alpha
        self.name = name
        self.warmup_steps = warmup_steps
        self.warmup_target = warmup_target

        if self.decay_steps <= 0:
            raise ValueError(
                "Argument `decay_steps` must be > 0. "
                f"Received: decay_steps={self.decay_steps}"
            )

    def _decay_function(self, step, decay_steps, decay_from_lr, dtype):
        # Cosine anneal from `decay_from_lr` towards `alpha * decay_from_lr`.
        with ops.name_scope(self.name):
            fraction_done = step / decay_steps
            pi = ops.array(math.pi, dtype=dtype)
            cosine_term = 0.5 * (1.0 + ops.cos(pi * fraction_done))
            scaled = (1 - self.alpha) * cosine_term + self.alpha
            return ops.multiply(decay_from_lr, scaled)

    def _warmup_function(
        self, step, warmup_steps, warmup_target, initial_learning_rate
    ):
        # Linear ramp from `initial_learning_rate` up to `warmup_target`.
        with ops.name_scope(self.name):
            fraction_done = step / warmup_steps
            delta = warmup_target - initial_learning_rate
            return delta * fraction_done + initial_learning_rate

    def __call__(self, step):
        with ops.name_scope(self.name):
            init_lr = ops.convert_to_tensor(self.initial_learning_rate)
            dtype = init_lr.dtype
            decay_steps = ops.cast(self.decay_steps, dtype)
            current = ops.cast(step, dtype)

            if self.warmup_target is None:
                # No warmup phase: plain cosine decay from the initial rate,
                # clamped so the rate stays at its floor afterwards.
                current = ops.minimum(current, decay_steps)
                return self._decay_function(
                    current, decay_steps, init_lr, dtype
                )

            warmup_target = ops.cast(self.warmup_target, dtype)
            warmup_steps = ops.cast(self.warmup_steps, dtype)

            current = ops.minimum(current, decay_steps + warmup_steps)

            # Before `warmup_steps`: linear ramp; after: cosine decay with
            # the step counter re-based to the end of warmup.
            return ops.cond(
                current < warmup_steps,
                lambda: self._warmup_function(
                    current, warmup_steps, warmup_target, init_lr
                ),
                lambda: self._decay_function(
                    current - warmup_steps, decay_steps, warmup_target, dtype
                ),
            )

    def get_config(self):
        return {
            "initial_learning_rate": self.initial_learning_rate,
            "decay_steps": self.decay_steps,
            "alpha": self.alpha,
            "name": self.name,
            "warmup_target": self.warmup_target,
            "warmup_steps": self.warmup_steps,
        }
@keras_export("keras.optimizers.schedules.CosineDecayRestarts")
class CosineDecayRestarts(LearningRateSchedule):
    """A `LearningRateSchedule` that uses a cosine decay schedule with restarts.

    See [Loshchilov & Hutter, ICLR2016](https://arxiv.org/abs/1608.03983),
    SGDR: Stochastic Gradient Descent with Warm Restarts.

    The learning rate multiplier first decays from 1 to `alpha` over
    `first_decay_steps` steps. Then a warm restart is performed: each new
    period runs for `t_mul` times more steps and starts at `m_mul` times
    the previous period's initial learning rate.

    Example:
    ```python
    first_decay_steps = 1000
    lr_decayed_fn = keras.optimizers.schedules.CosineDecayRestarts(
        initial_learning_rate, first_decay_steps)
    ```

    You can pass this schedule directly into a `keras.optimizers.Optimizer`
    as the learning rate. The schedule is serializable and deserializable
    via `keras.optimizers.schedules.serialize` and
    `keras.optimizers.schedules.deserialize`.

    Args:
        initial_learning_rate: A Python float. The initial learning rate.
        first_decay_steps: A Python integer. Number of steps to decay over.
        t_mul: A Python float. Used to derive the number of iterations in
            the i-th period.
        m_mul: A Python float. Used to derive the initial learning rate of
            the i-th period.
        alpha: A Python float. Minimum learning rate value as a fraction of
            the `initial_learning_rate`.
        name: String. Optional name of the operation. Defaults to
            `"SGDRDecay"`.

    Returns:
        A 1-arg callable learning rate schedule that takes the current
        optimizer step and outputs the decayed learning rate, a scalar
        tensor of the same type as `initial_learning_rate`.
    """

    def __init__(
        self,
        initial_learning_rate,
        first_decay_steps,
        t_mul=2.0,
        m_mul=1.0,
        alpha=0.0,
        name="SGDRDecay",
    ):
        super().__init__()

        self.initial_learning_rate = initial_learning_rate
        self.first_decay_steps = first_decay_steps
        self._t_mul = t_mul
        self._m_mul = m_mul
        self.alpha = alpha
        self.name = name

        if self.first_decay_steps <= 0:
            raise ValueError(
                "Argument `first_decay_steps` must be > 0. "
                f"Received: first_decay_steps={self.first_decay_steps}"
            )

    def __call__(self, step):
        with ops.name_scope(self.name):
            init_lr = ops.convert_to_tensor(self.initial_learning_rate)
            dtype = init_lr.dtype
            first_decay_steps = ops.cast(self.first_decay_steps, dtype)
            alpha = ops.cast(self.alpha, dtype)
            t_mul = ops.cast(self._t_mul, dtype)
            m_mul = ops.cast(self._m_mul, dtype)

            # Progress measured in units of the first period's length.
            completed_fraction = ops.cast(step, dtype) / first_decay_steps

            def locate_period(completed_fraction, geometric=False):
                """Return (restart index, fraction within that period)."""
                if geometric:
                    # Periods grow geometrically by `t_mul`; invert the
                    # geometric series sum to find the period index.
                    # ops.log is sensitive to the precision of dtype, so the
                    # additional cast is needed.
                    i_restart = ops.floor(
                        ops.log(
                            ops.cast(
                                1.0 - completed_fraction * (1.0 - t_mul), dtype
                            )
                        )
                        / ops.log(t_mul)
                    )

                    sum_r = (1.0 - t_mul**i_restart) / (1.0 - t_mul)
                    completed_fraction = (
                        completed_fraction - sum_r
                    ) / t_mul**i_restart
                else:
                    # Equal-length periods: index and remainder are direct.
                    i_restart = ops.floor(completed_fraction)
                    completed_fraction -= i_restart

                return i_restart, completed_fraction

            i_restart, completed_fraction = ops.cond(
                ops.equal(t_mul, 1.0),
                lambda: locate_period(completed_fraction, geometric=False),
                lambda: locate_period(completed_fraction, geometric=True),
            )

            # Each restart scales the starting rate by m_mul^i.
            m_fac = m_mul**i_restart
            cosine_decayed = (
                0.5
                * m_fac
                * (
                    1.0
                    + ops.cos(
                        ops.array(math.pi, dtype=dtype) * completed_fraction
                    )
                )
            )
            decayed = (1 - alpha) * cosine_decayed + alpha

            return ops.multiply(init_lr, decayed)

    def get_config(self):
        return {
            "initial_learning_rate": self.initial_learning_rate,
            "first_decay_steps": self.first_decay_steps,
            "t_mul": self._t_mul,
            "m_mul": self._m_mul,
            "alpha": self.alpha,
            "name": self.name,
        }
@keras_export("keras.optimizers.schedules.serialize")
def serialize(learning_rate_schedule):
    """Serializes a `LearningRateSchedule` into a JSON-compatible dict.

    Args:
        learning_rate_schedule: The `LearningRateSchedule` object to
            serialize.

    Returns:
        A JSON-serializable dict representing the object's config.

    Example:

    >>> lr_schedule = keras.optimizers.schedules.ExponentialDecay(
    ...     0.1, decay_steps=100000, decay_rate=0.96, staircase=True)
    >>> keras.optimizers.schedules.serialize(lr_schedule)
    {'module': 'keras.optimizers.schedules',
    'class_name': 'ExponentialDecay', 'config': {...},
    'registered_name': None}
    """
    # Delegate entirely to the shared serialization machinery.
    return serialization_lib.serialize_keras_object(learning_rate_schedule)


@keras_export("keras.optimizers.schedules.deserialize")
def deserialize(config, custom_objects=None):
    """Instantiates a `LearningRateSchedule` object from a serialized form.

    Args:
        config: The serialized form of the `LearningRateSchedule`.
            Dictionary of the form {'class_name': str, 'config': dict}.
        custom_objects: A dictionary mapping class names (or function
            names) of custom (non-Keras) objects to class/functions.

    Returns:
        A `LearningRateSchedule` object.

    Example:

    ```python
    # Configuration for PolynomialDecay
    config = {
        'class_name': 'PolynomialDecay',
        'config': {'cycle': False,
            'decay_steps': 10000,
            'end_learning_rate': 0.01,
            'initial_learning_rate': 0.1,
            'name': None,
            'power': 0.5
        }
    }
    lr_schedule = keras.optimizers.schedules.deserialize(config)
    ```
    """
    # `globals()` exposes every schedule class defined in this module as a
    # candidate target for deserialization.
    return serialization_lib.deserialize_keras_object(
        config,
        module_objects=globals(),
        custom_objects=custom_objects,
        printable_module_name="decay",
    )
@keras_export("keras.optimizers.SGD")
class SGD(optimizer.Optimizer):
    """Gradient descent (with momentum) optimizer.

    Update rule for parameter `w` with gradient `g` when `momentum` is 0:

    ```python
    w = w - learning_rate * g
    ```

    Update rule when `momentum` is larger than 0:

    ```python
    velocity = momentum * velocity - learning_rate * g
    w = w + velocity
    ```

    When `nesterov=True`, this rule becomes:

    ```python
    velocity = momentum * velocity - learning_rate * g
    w = w + momentum * velocity - learning_rate * g
    ```

    Args:
        learning_rate: A float, a
            `keras.optimizers.schedules.LearningRateSchedule` instance, or
            a callable that takes no arguments and returns the actual value
            to use. The learning rate. Defaults to `0.01`.
        momentum: float hyperparameter >= 0 that accelerates gradient
            descent in the relevant direction and dampens oscillations. 0 is
            vanilla gradient descent. Defaults to `0.0`.
        nesterov: boolean. Whether to apply Nesterov momentum.
            Defaults to `False`.
        {{base_optimizer_keyword_args}}
    """

    def __init__(
        self,
        learning_rate=0.01,
        momentum=0.0,
        nesterov=False,
        weight_decay=None,
        clipnorm=None,
        clipvalue=None,
        global_clipnorm=None,
        use_ema=False,
        ema_momentum=0.99,
        ema_overwrite_frequency=None,
        loss_scale_factor=None,
        gradient_accumulation_steps=None,
        name="SGD",
        **kwargs,
    ):
        super().__init__(
            learning_rate=learning_rate,
            name=name,
            weight_decay=weight_decay,
            clipnorm=clipnorm,
            clipvalue=clipvalue,
            global_clipnorm=global_clipnorm,
            use_ema=use_ema,
            ema_momentum=ema_momentum,
            ema_overwrite_frequency=ema_overwrite_frequency,
            loss_scale_factor=loss_scale_factor,
            gradient_accumulation_steps=gradient_accumulation_steps,
            **kwargs,
        )
        # Accept ints as well as floats (e.g. `momentum=0`); a strict
        # `isinstance(momentum, float)` check would reject them.
        if not isinstance(momentum, (int, float)) or not 0 <= momentum <= 1:
            raise ValueError(
                "`momentum` must be a float between [0, 1]. "
                f"Received: momentum={momentum}"
            )
        self.momentum = float(momentum)
        self.nesterov = nesterov

    def build(self, variables):
        """Initialize optimizer variables.

        SGD optimizer has one variable `momentums`, only set if
        `self.momentum` is not 0.

        Args:
            variables: list of model variables to build SGD variables on.
        """
        if self.built:
            return
        super().build(variables)
        self.momentums = []
        if self.momentum != 0:
            # One velocity slot per trainable variable, index-aligned with
            # `variables` (looked up via `_get_variable_index`).
            for variable in variables:
                self.momentums.append(
                    self.add_variable_from_reference(
                        reference_variable=variable, name="momentum"
                    )
                )

    def update_step(self, gradient, variable, learning_rate):
        """Update step given gradient and the associated model variable."""
        learning_rate = ops.cast(learning_rate, variable.dtype)
        gradient = ops.cast(gradient, variable.dtype)
        m = None
        if self.momentum != 0:
            m = self.momentums[self._get_variable_index(variable)]

        if m is not None:
            momentum = ops.cast(self.momentum, variable.dtype)
            # velocity = momentum * velocity - lr * g
            self.assign(
                m,
                ops.subtract(
                    ops.multiply(m, momentum),
                    ops.multiply(gradient, learning_rate),
                ),
            )
            if self.nesterov:
                # Nesterov look-ahead: w += momentum * velocity - lr * g
                self.assign_add(
                    variable,
                    ops.subtract(
                        ops.multiply(m, momentum),
                        ops.multiply(gradient, learning_rate),
                    ),
                )
            else:
                # Classic momentum: w += velocity
                self.assign_add(variable, m)
        else:
            # Vanilla gradient descent: w -= lr * g
            self.assign_sub(variable, ops.multiply(gradient, learning_rate))

    def get_config(self):
        config = super().get_config()
        config.update(
            {
                "momentum": self.momentum,
                "nesterov": self.nesterov,
            }
        )
        return config


SGD.__doc__ = SGD.__doc__.replace(
    "{{base_optimizer_keyword_args}}", optimizer.base_optimizer_keyword_args
)
from keras.src.quantizers.quantizers import compute_float8_amax_history
from keras.src.quantizers.quantizers import compute_float8_scale
from keras.src.quantizers.quantizers import quantize_and_dequantize
from keras.src.saving import serialization_lib
from keras.src.utils.naming import to_snake_case

# Registry of built-in quantizers, addressable both by class name and by its
# snake_case alias (e.g. "AbsMaxQuantizer" and "abs_max_quantizer").
ALL_OBJECTS = {Quantizer, AbsMaxQuantizer}
ALL_OBJECTS_DICT = {cls.__name__: cls for cls in ALL_OBJECTS}
ALL_OBJECTS_DICT.update(
    {to_snake_case(cls.__name__): cls for cls in ALL_OBJECTS}
)


@keras_export("keras.quantizers.serialize")
def serialize(initializer):
    """Return a JSON-serializable config dict for a Keras quantizer."""
    return serialization_lib.serialize_keras_object(initializer)


@keras_export("keras.quantizers.deserialize")
def deserialize(config, custom_objects=None):
    """Return a Keras quantizer object via its config."""
    return serialization_lib.deserialize_keras_object(
        config,
        module_objects=ALL_OBJECTS_DICT,
        custom_objects=custom_objects,
    )


@keras_export("keras.quantizers.get")
def get(identifier, **kwargs):
    """Retrieve a Keras quantizer object via an identifier.

    Args:
        identifier: `None`, a config dict, a registered string name, or a
            quantizer instance/class.
        **kwargs: keyword arguments forwarded to the quantizer constructor
            when `identifier` resolves to a class.

    Returns:
        A quantizer instance, or `None` if `identifier` is `None`.

    Raises:
        ValueError: if the identifier cannot be interpreted.
    """
    if identifier is None:
        return None
    if isinstance(identifier, dict):
        obj = deserialize(identifier)
    elif isinstance(identifier, str):
        obj = ALL_OBJECTS_DICT.get(identifier, None)
    else:
        obj = identifier

    if callable(obj):
        if inspect.isclass(obj):
            # Expand the keyword arguments into the constructor. Passing the
            # dict positionally (`obj(kwargs)`) would bind it to the first
            # parameter (e.g. `axis` for `AbsMaxQuantizer`), which was a bug.
            obj = obj(**kwargs)
        return obj
    else:
        raise ValueError(
            f"Could not interpret quantizer identifier: {identifier}"
        )
import ml_dtypes
import numpy as np

from keras.src import backend
from keras.src import ops
from keras.src.api_export import keras_export
from keras.src.backend.common.backend_utils import standardize_axis_for_numpy

"""Int8-related classes and methods"""


@keras_export(["keras.Quantizer", "keras.quantizers.Quantizer"])
class Quantizer:
    """Base class for quantizers.

    Subclasses override `__call__` to map an input tensor to its quantized
    form; this base implementation is the identity.
    """

    def __init__(self, output_dtype="int8"):
        # Dtype of the quantized output produced by `__call__`.
        self.output_dtype = output_dtype

    def __call__(self, x):
        """Compute a quantized output from an input tensor."""
        # Identity by default; subclasses implement the actual quantization.
        return x

    @classmethod
    def from_config(cls, config):
        """Creates a quantizer from its config.

        This method is the reverse of `get_config`, capable of
        instantiating the same quantizer from the config dictionary.

        Args:
            config: A Python dictionary, typically the output of
                `get_config`.

        Returns:
            A quantizer instance.
        """
        return cls(**config)

    def get_config(self):
        """Returns the config of the quantizer.

        A quantizer config is a Python dictionary (serializable) containing
        all configuration parameters of the quantizer. The same quantizer
        can be reinstantiated later (without any saved state) from this
        configuration.

        Returns:
            Python dictionary.
        """
        # Base class carries no serializable state contract; subclasses must
        # provide their own config.
        raise NotImplementedError(f"{self} does not implement get_config()")
+ + Returns: + A quantizer instance. + """ + return cls(**config) + + def get_config(self): + """Returns the config of the quantizer. + + A quantizer config is a Python dictionary (serializable) + containing all configuration parameters of the quantizer. + The same quantizer can be reinstantiated later + (without any saved state) from this configuration. + + This method is optional if you are just training and executing models, + exporting to and from SavedModels, or using weight checkpoints. + + This method is required for Keras `model_to_estimator`, saving and + loading models to HDF5 formats, Keras model cloning, some visualization + utilities, and exporting models to and from JSON. + + Returns: + Python dictionary. + """ + raise NotImplementedError(f"{self} does not implement get_config()") + + +@keras_export("keras.quantizers.abs_max_quantize") +def abs_max_quantize( + inputs, + axis, + value_range=(-127, 127), + dtype="int8", + epsilon=backend.epsilon(), + to_numpy=False, +): + if to_numpy: + # Save memory on the device using numpy + original_dtype = backend.standardize_dtype(inputs.dtype) + inputs = ops.convert_to_numpy(inputs) + axis = standardize_axis_for_numpy(axis) + scale = np.divide( + value_range[1], + np.add(np.max(np.abs(inputs), axis=axis, keepdims=True), epsilon), + ) + outputs = np.multiply(inputs, scale) + outputs = np.clip(np.round(outputs), value_range[0], value_range[1]) + outputs = outputs.astype(dtype) + return ops.convert_to_tensor(outputs), ops.convert_to_tensor( + scale, dtype=original_dtype + ) + + inputs = ops.convert_to_tensor(inputs) + scale = ops.divide( + value_range[1], + ops.add(ops.max(ops.abs(inputs), axis=axis, keepdims=True), epsilon), + ) + scale = ops.cast(scale, backend.standardize_dtype(inputs.dtype)) + outputs = ops.multiply(inputs, scale) + outputs = ops.clip(ops.round(outputs), value_range[0], value_range[1]) + outputs = ops.cast(outputs, dtype) + return outputs, scale + + 
+@keras_export("keras.quantizers.AbsMaxQuantizer") +class AbsMaxQuantizer(Quantizer): + def __init__( + self, + axis, + value_range=(-127, 127), + epsilon=backend.epsilon(), + output_dtype="int8", + ): + Quantizer.__init__(self, output_dtype=output_dtype) + if isinstance(axis, int): + axis = (axis,) + self.axis = tuple(axis) + self.value_range = value_range + self.epsilon = epsilon + + def __call__(self, x): + quantized_x, scale = abs_max_quantize( + x, self.axis, self.value_range, self.output_dtype, self.epsilon + ) + return quantized_x, scale + + def get_config(self): + return { + "axis": self.axis, + "value_range": self.value_range, + "epsilon": self.epsilon, + "output_dtype": self.output_dtype, + } + + +"""Float8-related methods""" + + +@keras_export("keras.quantizers.compute_float8_scale") +def compute_float8_scale(amax, scale, dtype_max, margin=0): + # The algorithm for computing the new scale is sourced from + # https://docs.nvidia.com/deeplearning/transformer-engine/user-guide/api/jax.html#transformer_engine.jax.update_fp8_metas + # wherein the `original_scale` corresponds to the reciprocal of the + # `scale` passed in this function. 
+ scale = ops.reciprocal(scale) + sf = ops.divide(ops.divide(dtype_max, amax), 2**margin) + sf = ops.where(amax > 0.0, sf, scale) + sf = ops.where(ops.isfinite(amax), sf, scale) + return ops.reciprocal(sf) + + +@keras_export("keras.quantizers.compute_float8_amax_history") +def compute_float8_amax_history(x, amax_history): + amax_update = ops.cast(ops.max(ops.abs(x)), amax_history.dtype) + new_amax_history = ops.scatter_update( + ops.roll(amax_history, shift=-1), + [[0]], + ops.reshape(amax_update, [1]), + ) + return new_amax_history + + +@keras_export("keras.quantizers.quantize_and_dequantize") +def quantize_and_dequantize(inputs, scale, quantized_dtype, compute_dtype): + # Quantize + quantized_dtype_max = ops.cast( + float(ml_dtypes.finfo(quantized_dtype).max), compute_dtype + ) + x = ops.divide(inputs, ops.cast(scale, compute_dtype)) + x = ops.clip(x, -quantized_dtype_max, quantized_dtype_max) + x = ops.cast(x, quantized_dtype) + + # Dequantize + x = ops.multiply(ops.cast(x, compute_dtype), ops.cast(scale, compute_dtype)) + return x diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__init__.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..4ba54c78837ce944f0278820b6721566a913ea67 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__init__.py @@ -0,0 +1,9 @@ +from keras.src.random.random import categorical +from keras.src.random.random import dropout +from keras.src.random.random import gamma +from keras.src.random.random import normal +from keras.src.random.random import randint +from keras.src.random.random import shuffle +from keras.src.random.random import truncated_normal +from keras.src.random.random import uniform +from keras.src.random.seed_generator import SeedGenerator diff --git 
a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/__init__.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..8f750d92aafc13fe6733e8d89a6ea1277cbcd068 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/__init__.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/random.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/random.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..0ac53cab8d2607df2e6f2eb3999ce64ffdecf497 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/random.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/seed_generator.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/seed_generator.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2c3533e9eab3809931a0359408e90098147254e8 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/__pycache__/seed_generator.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/random.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/random.py new file mode 100644 index 0000000000000000000000000000000000000000..6b65c12ac4b4bceb91cf4ca140930fb5d951e66a --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/random.py @@ -0,0 +1,345 @@ +from keras.src import backend +from keras.src.api_export import 
keras_export + + +@keras_export("keras.random.normal") +def normal(shape, mean=0.0, stddev=1.0, dtype=None, seed=None): + """Draw random samples from a normal (Gaussian) distribution. + + Args: + shape: The shape of the random values to generate. + mean: Float, defaults to 0. Mean of the random values to generate. + stddev: Float, defaults to 1. Standard deviation of the random values + to generate. + dtype: Optional dtype of the tensor. Only floating point types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`). + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value `seed=None` + will produce an error, and a `seed` argument must be provided. + """ + return backend.random.normal( + shape, mean=mean, stddev=stddev, dtype=dtype, seed=seed + ) + + +@keras_export("keras.random.categorical") +def categorical(logits, num_samples, dtype="int32", seed=None): + """Draws samples from a categorical distribution. + + This function takes as input `logits`, a 2-D input tensor with shape + (batch_size, num_classes). Each row of the input represents a categorical + distribution, with each column index containing the log-probability for a + given class. 
+ + The function will output a 2-D tensor with shape (batch_size, num_samples), + where each row contains samples from the corresponding row in `logits`. + Each column index contains an independent samples drawn from the input + distribution. + + Args: + logits: 2-D Tensor with shape (batch_size, num_classes). Each row + should define a categorical distribution with the unnormalized + log-probabilities for all classes. + num_samples: Int, the number of independent samples to draw for each + row of the input. This will be the second dimension of the output + tensor's shape. + dtype: Optional dtype of the output tensor. + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. + + Returns: + A 2-D tensor with (batch_size, num_samples). + """ + logits_shape = list(backend.convert_to_tensor(logits).shape) + if len(logits_shape) != 2: + raise ValueError( + "`logits` should be a 2-D tensor with shape " + f"[batch_size, num_classes]. Received: logits={logits}" + ) + return backend.random.categorical( + logits, num_samples, dtype=dtype, seed=seed + ) + + +@keras_export("keras.random.uniform") +def uniform(shape, minval=0.0, maxval=1.0, dtype=None, seed=None): + """Draw samples from a uniform distribution. 
+ + The generated values follow a uniform distribution in the range + `[minval, maxval)`. The lower bound `minval` is included in the range, + while the upper bound `maxval` is excluded. + + `dtype` must be a floating point type, the default range is `[0, 1)`. + + Args: + shape: The shape of the random values to generate. + minval: Float, defaults to 0. Lower bound of the range of + random values to generate (inclusive). + maxval: Float, defaults to 1. Upper bound of the range of + random values to generate (exclusive). + dtype: Optional dtype of the tensor. Only floating point types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`) + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. + """ + if dtype and not backend.is_float_dtype(dtype): + raise ValueError( + "`keras.random.uniform` requires a floating point `dtype`. " + f"Received: dtype={dtype} " + ) + return backend.random.uniform( + shape, minval=minval, maxval=maxval, dtype=dtype, seed=seed + ) + + +@keras_export("keras.random.randint") +def randint(shape, minval, maxval, dtype="int32", seed=None): + """Draw random integers from a uniform distribution. 
+ + The generated values follow a uniform distribution in the range + `[minval, maxval)`. The lower bound `minval` is included in the range, + while the upper bound `maxval` is excluded. + + `dtype` must be an integer type. + + Args: + shape: The shape of the random values to generate. + minval: Float, defaults to 0. Lower bound of the range of + random values to generate (inclusive). + maxval: Float, defaults to 1. Upper bound of the range of + random values to generate (exclusive). + dtype: Optional dtype of the tensor. Only integer types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`) + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. + """ + if dtype and not backend.is_int_dtype(dtype): + raise ValueError( + "`keras.random.randint` requires an integer `dtype`. " + f"Received: dtype={dtype} " + ) + return backend.random.randint( + shape, minval=minval, maxval=maxval, dtype=dtype, seed=seed + ) + + +@keras_export("keras.random.truncated_normal") +def truncated_normal(shape, mean=0.0, stddev=1.0, dtype=None, seed=None): + """Draw samples from a truncated normal distribution. 
+ + The values are drawn from a normal distribution with specified mean and + standard deviation, discarding and re-drawing any samples that are more + than two standard deviations from the mean. + + Args: + shape: The shape of the random values to generate. + mean: Float, defaults to 0. Mean of the random values to generate. + stddev: Float, defaults to 1. Standard deviation of the random values + to generate. + dtype: Optional dtype of the tensor. Only floating point types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`) + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. + """ + return backend.random.truncated_normal( + shape, mean=mean, stddev=stddev, dtype=dtype, seed=seed + ) + + +@keras_export("keras.random.dropout") +def dropout(inputs, rate, noise_shape=None, seed=None): + return backend.random.dropout( + inputs, rate, noise_shape=noise_shape, seed=seed + ) + + +@keras_export("keras.random.shuffle") +def shuffle(x, axis=0, seed=None): + """Shuffle the elements of a tensor uniformly at random along an axis. + + Args: + x: The tensor to be shuffled. 
+ axis: An integer specifying the axis along which to shuffle. Defaults to + `0`. + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. + """ + return backend.random.shuffle(x, axis=axis, seed=seed) + + +@keras_export("keras.random.gamma") +def gamma(shape, alpha, dtype=None, seed=None): + """Draw random samples from the Gamma distribution. + + Args: + shape: The shape of the random values to generate. + alpha: Float, the parameter of the distribution. + dtype: Optional dtype of the tensor. Only floating point types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`). + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. 
+ Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. + """ + return backend.random.gamma(shape, alpha=alpha, dtype=dtype, seed=seed) + + +@keras_export("keras.random.binomial") +def binomial(shape, counts, probabilities, dtype=None, seed=None): + """Draw samples from a Binomial distribution. + + The values are drawn from a Binomial distribution with + specified trial count and probability of success. + + Args: + shape: The shape of the random values to generate. + counts: A number or array of numbers representing the + number of trials. It must be broadcastable with `probabilities`. + probabilities: A float or array of floats representing the + probability of success of an individual event. + It must be broadcastable with `counts`. + dtype: Optional dtype of the tensor. Only floating point types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`). + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. 
+ """ + return backend.random.binomial( + shape, + counts=counts, + probabilities=probabilities, + dtype=dtype, + seed=seed, + ) + + +@keras_export("keras.random.beta") +def beta(shape, alpha, beta, dtype=None, seed=None): + """Draw samples from a Beta distribution. + + The values are drawn from a Beta distribution parametrized + by alpha and beta. + + Args: + shape: The shape of the random values to generate. + alpha: Float or an array of floats representing the first + parameter alpha. Must be broadcastable with `beta` and `shape`. + beta: Float or an array of floats representing the second + parameter beta. Must be broadcastable with `alpha` and `shape`. + dtype: Optional dtype of the tensor. Only floating point types are + supported. If not specified, `keras.config.floatx()` is used, + which defaults to `float32` unless you configured it otherwise (via + `keras.config.set_floatx(float_dtype)`). + seed: Optional Python integer or instance of + `keras.random.SeedGenerator`. + By default, the `seed` argument is `None`, and an internal global + `keras.random.SeedGenerator` is used. The `seed` argument can be + used to ensure deterministic (repeatable) random number generation. + Note that passing an integer as the `seed` value will produce the + same random values for each call. To generate different random + values for repeated calls, an instance of + `keras.random.SeedGenerator` must be provided as the `seed` value. + Remark concerning the JAX backend: When tracing functions with the + JAX backend the global `keras.random.SeedGenerator` is not + supported. Therefore, during tracing the default value seed=None + will produce an error, and a `seed` argument must be provided. 
+ """ + return backend.random.beta( + shape=shape, alpha=alpha, beta=beta, dtype=dtype, seed=seed + ) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/seed_generator.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/seed_generator.py new file mode 100644 index 0000000000000000000000000000000000000000..00131e3f4e55e55eda75011d17161b328100a294 --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/random/seed_generator.py @@ -0,0 +1,161 @@ +import random as python_random + +import numpy as np + +from keras.src import backend +from keras.src.api_export import keras_export +from keras.src.backend.common import global_state +from keras.src.utils import jax_utils +from keras.src.utils.naming import auto_name + + +@keras_export("keras.random.SeedGenerator") +class SeedGenerator: + """Generates variable seeds upon each call to a function generating + random numbers. + + In Keras, all random number generators (such as + `keras.random.normal()`) are stateless, meaning that if you pass an + integer seed to them (such as `seed=42`), they will return the same + values for repeated calls. To get different values for each + call, a `SeedGenerator` providing the state of the random generator + has to be used. + + Note that all the random number generators have a default seed of None, + which implies that an internal global SeedGenerator is used. + If you need to decouple the RNG from the global state you can provide + a local `StateGenerator` with either a deterministic or random initial + state. + + Remark concerning the JAX backen: Note that the use of a local + `StateGenerator` as seed argument is required for JIT compilation of + RNG with the JAX backend, because the use of global state is not + supported. 
+ + Example: + + ```python + seed_gen = keras.random.SeedGenerator(seed=42) + values = keras.random.normal(shape=(2, 3), seed=seed_gen) + new_values = keras.random.normal(shape=(2, 3), seed=seed_gen) + ``` + + Usage in a layer: + + ```python + class Dropout(keras.Layer): + def __init__(self, **kwargs): + super().__init__(**kwargs) + self.seed_generator = keras.random.SeedGenerator(1337) + + def call(self, x, training=False): + if training: + return keras.random.dropout( + x, rate=0.5, seed=self.seed_generator + ) + return x + ``` + """ + + def __init__(self, seed=None, name=None, **kwargs): + if name is None: + name = auto_name(self.__class__.__name__) + self.name = name + + custom_backend = kwargs.pop("backend", None) + if kwargs: + raise ValueError(f"Unrecognized keyword arguments: {kwargs}") + if custom_backend is not None: + self.backend = custom_backend + else: + self.backend = backend + + self._initial_seed = seed + if seed is None: + seed = make_default_seed() + + if not isinstance(seed, int): + raise ValueError( + "Argument `seed` must be an integer. 
" f"Received: seed={seed}" + ) + + def seed_initializer(*args, **kwargs): + dtype = kwargs.get("dtype", None) + return self.backend.convert_to_tensor([seed, 0], dtype=dtype) + + with self.backend.name_scope(self.name, caller=self): + self.state = self.backend.Variable( + seed_initializer, + shape=(2,), + dtype=self.backend.random_seed_dtype(), + trainable=False, + aggregation="none", + name="seed_generator_state", + ) + + def next(self, ordered=True): + seed_state = self.state + # Use * 1 to create a copy + new_seed_value = seed_state.value * 1 + if ordered: + increment = self.backend.convert_to_tensor( + np.array([0, 1]), dtype=seed_state.dtype + ) + self.state.assign(self.backend.numpy.add(seed_state, increment)) + else: + # This produces a sequence of near-unique numbers + # between 0 and 1M + self.state.assign((seed_state + 1) * 5387 % 933199) + return new_seed_value + + def get_config(self): + return {"seed": self._initial_seed} + + @classmethod + def from_config(cls, config): + return cls(**config) + + +def global_seed_generator(): + if jax_utils.is_in_jax_tracing_scope(): + raise ValueError( + "[JAX RNG] When tracing a JAX function, " + "you should only use seeded random ops, e.g. " + "you should create a `SeedGenerator` instance, attach it " + "to your layer/model, and pass the instance as the `seed` " + "argument when calling random ops. Unseeded random ops " + "would get incorrectly traced by JAX and would become constant " + "after tracing. 
Example:\n\n" + "```\n" + "# Make sure to set the seed generator as a layer attribute\n" + "self.seed_generator = keras.random.SeedGenerator(seed=1337)\n" + "...\n" + "out = keras.random.normal(shape=(1,), seed=self.seed_generator)\n" + "```" + ) + gen = global_state.get_global_attribute("global_seed_generator") + if gen is None: + gen = SeedGenerator() + global_state.set_global_attribute("global_seed_generator", gen) + return gen + + +def make_default_seed(): + return python_random.randint(1, int(1e9)) + + +def draw_seed(seed): + from keras.src.backend import convert_to_tensor + from keras.src.backend import random_seed_dtype + + if isinstance(seed, SeedGenerator): + return seed.next() + elif isinstance(seed, int): + return convert_to_tensor([seed, 0], dtype=random_seed_dtype()) + elif seed is None: + return global_seed_generator().next(ordered=False) + raise ValueError( + "Argument `seed` must be either an integer " + "or an instance of `SeedGenerator`. " + f"Received: seed={seed} (of type {type(seed)})" + ) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__init__.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..c40bd6ab4549f28e15f0728543bc0f7c5a8eca8d --- /dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__init__.py @@ -0,0 +1,60 @@ +import inspect + +from keras.src.api_export import keras_export +from keras.src.regularizers.regularizers import L1 +from keras.src.regularizers.regularizers import L1L2 +from keras.src.regularizers.regularizers import L2 +from keras.src.regularizers.regularizers import OrthogonalRegularizer +from keras.src.regularizers.regularizers import Regularizer +from keras.src.saving import serialization_lib +from keras.src.utils.naming import to_snake_case + +ALL_OBJECTS = { + Regularizer, + L1, + L2, + L1L2, + 
OrthogonalRegularizer, +} + +ALL_OBJECTS_DICT = {cls.__name__: cls for cls in ALL_OBJECTS} +ALL_OBJECTS_DICT.update( + {to_snake_case(cls.__name__): cls for cls in ALL_OBJECTS} +) + + +@keras_export("keras.regularizers.serialize") +def serialize(regularizer): + return serialization_lib.serialize_keras_object(regularizer) + + +@keras_export("keras.regularizers.deserialize") +def deserialize(config, custom_objects=None): + """Return a Keras regularizer object via its config.""" + return serialization_lib.deserialize_keras_object( + config, + module_objects=ALL_OBJECTS_DICT, + custom_objects=custom_objects, + ) + + +@keras_export("keras.regularizers.get") +def get(identifier): + """Retrieve a Keras regularizer object via an identifier.""" + if identifier is None: + return None + if isinstance(identifier, dict): + obj = deserialize(identifier) + elif isinstance(identifier, str): + obj = ALL_OBJECTS_DICT.get(identifier, None) + else: + obj = identifier + + if callable(obj): + if inspect.isclass(obj): + obj = obj() + return obj + else: + raise ValueError( + f"Could not interpret regularizer identifier: {identifier}" + ) diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__pycache__/__init__.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..d4a5f8eabe314579c357799996738d48018765f5 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__pycache__/__init__.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__pycache__/regularizers.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/regularizers/__pycache__/regularizers.cpython-310.pyc new file mode 100644 index 
import math

from keras.src import ops
from keras.src.api_export import keras_export
from keras.src.utils.numerical_utils import normalize


@keras_export(["keras.Regularizer", "keras.regularizers.Regularizer"])
class Regularizer:
    """Regularizer base class.

    Regularizers allow you to apply penalties on layer parameters or layer
    activity during optimization. These penalties are summed into the loss
    function that the network optimizes.

    Regularization penalties are applied on a per-layer basis. The exact API
    will depend on the layer, but many layers (e.g. `Dense`, `Conv1D`,
    `Conv2D` and `Conv3D`) have a unified API.

    These layers expose 3 keyword arguments:

    - `kernel_regularizer`: Regularizer to apply a penalty on the layer's
      kernel
    - `bias_regularizer`: Regularizer to apply a penalty on the layer's bias
    - `activity_regularizer`: Regularizer to apply a penalty on the layer's
      output

    All layers (including custom layers) expose `activity_regularizer` as a
    settable property, whether or not it is in the constructor arguments.

    The value returned by the `activity_regularizer` is divided by the input
    batch size so that the relative weighting between the weight regularizers
    and the activity regularizers does not change with the batch size.

    You can access a layer's regularization penalties by calling
    `layer.losses` after calling the layer on inputs.

    ## Example

    >>> layer = Dense(
    ...     5, input_dim=5,
    ...     kernel_initializer='ones',
    ...     kernel_regularizer=L1(0.01),
    ...     activity_regularizer=L2(0.01))
    >>> tensor = ops.ones(shape=(5, 5)) * 2.0
    >>> out = layer(tensor)

    >>> # The kernel regularization term is 0.25
    >>> # The activity regularization term (after dividing by the batch size)
    >>> # is 5
    >>> ops.sum(layer.losses)
    5.25

    ## Available penalties

    ```python
    L1(0.3)  # L1 Regularization Penalty
    L2(0.1)  # L2 Regularization Penalty
    L1L2(l1=0.01, l2=0.01)  # L1 + L2 penalties
    ```

    ## Directly calling a regularizer

    Compute a regularization loss on a tensor by directly calling a
    regularizer as if it is a one-argument function.

    E.g.

    >>> regularizer = L2(2.)
    >>> tensor = ops.ones(shape=(5, 5))
    >>> regularizer(tensor)
    50.0

    ## Developing new regularizers

    Any function that takes in a weight matrix and returns a scalar
    tensor can be used as a regularizer, e.g.:

    >>> def l1_reg(weight_matrix):
    ...     return 0.01 * ops.sum(ops.absolute(weight_matrix))
    ...
    >>> layer = Dense(5, input_dim=5,
    ...               kernel_initializer='ones', kernel_regularizer=l1_reg)
    >>> tensor = ops.ones(shape=(5, 5))
    >>> out = layer(tensor)
    >>> layer.losses
    0.25

    Alternatively, you can write your custom regularizers in an
    object-oriented way by extending this regularizer base class, e.g.:

    >>> class L2Regularizer(Regularizer):
    ...     def __init__(self, l2=0.):
    ...         self.l2 = l2
    ...
    ...     def __call__(self, x):
    ...         return self.l2 * ops.sum(ops.square(x))
    ...
    ...     def get_config(self):
    ...         return {'l2': float(self.l2)}
    ...

    >>> layer = Dense(
    ...     5, input_dim=5, kernel_initializer='ones',
    ...     kernel_regularizer=L2Regularizer(l2=0.5))

    >>> tensor = ops.ones(shape=(5, 5))
    >>> out = layer(tensor)
    >>> layer.losses
    12.5

    ### A note on serialization and deserialization:

    Registering the regularizers as serializable is optional if you are just
    training and executing models, exporting to and from SavedModels, or
    saving and loading weight checkpoints.

    Registration is required for saving and loading models to HDF5 format,
    Keras model cloning, some visualization utilities, and exporting models
    to and from JSON. If using this functionality, you must make sure any
    python process running your model has also defined and registered your
    custom regularizer.
    """

    def __call__(self, x):
        """Compute a regularization penalty from an input tensor."""
        # Base class applies no penalty; subclasses override this.
        return 0.0

    @classmethod
    def from_config(cls, config):
        """Creates a regularizer from its config.

        This method is the reverse of `get_config`,
        capable of instantiating the same regularizer from the config
        dictionary.

        This method is used by Keras `model_to_estimator`, saving and
        loading models to HDF5 formats, Keras model cloning, some
        visualization utilities, and exporting models to and from JSON.

        Args:
            config: A Python dictionary, typically the output of get_config.

        Returns:
            A regularizer instance.
        """
        return cls(**config)

    def get_config(self):
        """Returns the config of the regularizer.

        A regularizer config is a Python dictionary (serializable)
        containing all configuration parameters of the regularizer.
        The same regularizer can be reinstantiated later
        (without any saved state) from this configuration.

        This method is optional if you are just training and executing
        models, exporting to and from SavedModels, or using weight
        checkpoints.

        This method is required for Keras `model_to_estimator`, saving and
        loading models to HDF5 formats, Keras model cloning, some
        visualization utilities, and exporting models to and from JSON.

        Returns:
            Python dictionary.
        """
        raise NotImplementedError(f"{self} does not implement get_config()")


@keras_export(["keras.regularizers.L1L2", "keras.regularizers.l1_l2"])
class L1L2(Regularizer):
    """A regularizer that applies both L1 and L2 regularization penalties.

    The L1 regularization penalty is computed as:
    `loss = l1 * reduce_sum(abs(x))`

    The L2 regularization penalty is computed as
    `loss = l2 * reduce_sum(square(x))`

    L1L2 may be passed to a layer as a string identifier:

    >>> dense = Dense(3, kernel_regularizer='l1_l2')

    In this case, the default values used are `l1=0.01` and `l2=0.01`.

    Arguments:
        l1: float, L1 regularization factor.
        l2: float, L2 regularization factor.
    """

    def __init__(self, l1=0.0, l2=0.0):
        # The default value for l1 and l2 are different from the value in
        # l1_l2 for backward compatibility reason. Eg, L1L2(l2=0.1) will only
        # have l2 and no l1 penalty.
        l1 = 0.0 if l1 is None else l1
        l2 = 0.0 if l2 is None else l2
        validate_float_arg(l1, name="l1")
        validate_float_arg(l2, name="l2")

        self.l1 = l1
        self.l2 = l2

    def __call__(self, x):
        regularization = ops.convert_to_tensor(0.0, dtype=x.dtype)
        # Skip each term when its factor is zero to avoid needless ops.
        if self.l1:
            regularization += self.l1 * ops.sum(ops.absolute(x))
        if self.l2:
            regularization += self.l2 * ops.sum(ops.square(x))
        return regularization

    def get_config(self):
        return {"l1": float(self.l1), "l2": float(self.l2)}


@keras_export(["keras.regularizers.L1", "keras.regularizers.l1"])
class L1(Regularizer):
    """A regularizer that applies a L1 regularization penalty.

    The L1 regularization penalty is computed as:
    `loss = l1 * reduce_sum(abs(x))`

    L1 may be passed to a layer as a string identifier:

    >>> dense = Dense(3, kernel_regularizer='l1')

    In this case, the default value used is `l1=0.01`.

    Arguments:
        l1: float, L1 regularization factor.
    """

    def __init__(self, l1=0.01):
        l1 = 0.01 if l1 is None else l1
        validate_float_arg(l1, name="l1")
        self.l1 = ops.convert_to_tensor(l1)

    def __call__(self, x):
        return self.l1 * ops.sum(ops.absolute(x))

    def get_config(self):
        return {"l1": float(self.l1)}


@keras_export(["keras.regularizers.L2", "keras.regularizers.l2"])
class L2(Regularizer):
    """A regularizer that applies a L2 regularization penalty.

    The L2 regularization penalty is computed as:
    `loss = l2 * reduce_sum(square(x))`

    L2 may be passed to a layer as a string identifier:

    >>> dense = Dense(3, kernel_regularizer='l2')

    In this case, the default value used is `l2=0.01`.

    Arguments:
        l2: float, L2 regularization factor.
    """

    def __init__(self, l2=0.01):
        l2 = 0.01 if l2 is None else l2
        validate_float_arg(l2, name="l2")
        self.l2 = l2

    def __call__(self, x):
        return self.l2 * ops.sum(ops.square(x))

    def get_config(self):
        return {"l2": float(self.l2)}


@keras_export(
    [
        "keras.regularizers.OrthogonalRegularizer",
        "keras.regularizers.orthogonal_regularizer",
    ]
)
class OrthogonalRegularizer(Regularizer):
    """Regularizer that encourages input vectors to be orthogonal to each
    other.

    It can be applied to either the rows of a matrix (`mode="rows"`) or its
    columns (`mode="columns"`). When applied to a `Dense` kernel of shape
    `(input_dim, units)`, rows mode will seek to make the feature vectors
    (i.e. the basis of the output space) orthogonal to each other.

    Arguments:
        factor: Float. The regularization factor. The regularization penalty
            will be proportional to `factor` times the mean of the dot
            products between the L2-normalized rows (if `mode="rows"`, or
            columns if `mode="columns"`) of the inputs, excluding the product
            of each row/column with itself. Defaults to `0.01`.
        mode: String, one of `{"rows", "columns"}`. Defaults to `"rows"`. In
            rows mode, the regularization effect seeks to make the rows of
            the input orthogonal to each other. In columns mode, it seeks to
            make the columns of the input orthogonal to each other.

    Example:

    >>> regularizer = OrthogonalRegularizer(factor=0.01)
    >>> layer = Dense(units=4, kernel_regularizer=regularizer)
    """

    def __init__(self, factor=0.01, mode="rows"):
        validate_float_arg(factor, name="factor")
        self.factor = ops.convert_to_tensor(factor)
        if mode not in {"rows", "columns"}:
            raise ValueError(
                "Invalid value for argument `mode`. Expected one of "
                f'{{"rows", "columns"}}. Received: mode={mode}'
            )
        self.mode = mode

    def __call__(self, inputs):
        if len(inputs.shape) != 2:
            raise ValueError(
                "Inputs to OrthogonalRegularizer must have rank 2. Received: "
                f"inputs.shape={inputs.shape}"
            )
        if self.mode == "rows":
            inputs = normalize(inputs, axis=1)
            product = ops.matmul(inputs, ops.transpose(inputs))
            size = inputs.shape[0]
        else:
            inputs = normalize(inputs, axis=0)
            product = ops.matmul(ops.transpose(inputs), inputs)
            size = inputs.shape[1]
        # Zero out the diagonal: self-products are always 1 after
        # normalization and should not be penalized.
        product_no_diagonal = product * (
            1.0 - ops.eye(size, dtype=inputs.dtype)
        )
        num_pairs = size * (size - 1.0) / 2.0
        # 0.5 compensates for counting each unordered pair twice
        # (the off-diagonal matrix is symmetric).
        return (
            self.factor
            * 0.5
            * ops.sum(ops.absolute(product_no_diagonal))
            / num_pairs
        )

    def get_config(self):
        return {"factor": float(self.factor), "mode": self.mode}


def validate_float_arg(value, name):
    """Check that a penalty factor is a finite, non-negative number.

    Args:
        value: The value to validate.
        name: Name of the argument being validated, used in the error
            message.

    Returns:
        `value` converted to `float`.

    Raises:
        ValueError: If `value` is not a non-negative finite float or int.
    """
    if (
        not isinstance(value, (float, int))
        or (math.isinf(value) or math.isnan(value))
        or value < 0
    ):
        # NOTE: a space was added between the two sentences; previously the
        # message rendered as "...non-negative float.Received: ...".
        raise ValueError(
            f"Invalid value for argument {name}: expected a non-negative "
            f"float. Received: {name}={value}"
        )
    return float(value)
keras.src.saving.serialization_lib import serialize_keras_object diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/__init__.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..0eba0f7488379619a009029fad51eb66151dd835 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/__init__.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/file_editor.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/file_editor.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..65aa78c1eb26de99f48d7839ccee95800e49b72e Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/file_editor.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/keras_saveable.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/keras_saveable.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a8f88f092d53d524b80aec6868233190105af597 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/keras_saveable.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/object_registration.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/object_registration.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..1a751ba43055985c284bff826a9a3aeafdc175d9 Binary files /dev/null 
and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/object_registration.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/saving_api.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/saving_api.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ac6d6af4642b40630e3a08479c5017676fac6c18 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/saving_api.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/saving_lib.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/saving_lib.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..f511129db4d57ea2b6d3f837c1517a571299fb8c Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/saving_lib.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/serialization_lib.cpython-310.pyc b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/serialization_lib.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..11d8d70e7b0ca4a290dd3b95c2fd67045e081c47 Binary files /dev/null and b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/__pycache__/serialization_lib.cpython-310.pyc differ diff --git a/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/file_editor.py b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/file_editor.py new file mode 100644 index 0000000000000000000000000000000000000000..09cd7b87c14c9b5c7cbaa0322400385c1af04ed4 --- 
/dev/null +++ b/SwarmUI/dlbackend/ComfyUI/venv/lib/python3.10/site-packages/keras/src/saving/file_editor.py @@ -0,0 +1,817 @@ +import collections +import json +import pprint +import zipfile + +import h5py +import numpy as np +import rich.console + +from keras.src import backend +from keras.src.api_export import keras_export +from keras.src.saving import saving_lib +from keras.src.saving.saving_lib import H5IOStore +from keras.src.utils import naming +from keras.src.utils import summary_utils + +try: + import IPython as ipython +except ImportError: + ipython = None + + +def is_ipython_notebook(): + """Checks if the code is being executed in a notebook.""" + try: + from IPython import get_ipython + + # Check if an active IPython shell exists. + if get_ipython() is not None: + return True + return False + except ImportError: + return False + + +@keras_export("keras.saving.KerasFileEditor") +class KerasFileEditor: + """Utility to inspect, edit, and resave Keras weights files. + + You will find this class useful when adapting + an old saved weights file after having made + architecture changes to a model. + + Args: + filepath: The path to a local file to inspect and edit. 
+ + Examples: + + ```python + editor = KerasFileEditor("my_model.weights.h5") + + # Displays current contents + editor.summary() + + # Remove the weights of an existing layer + editor.delete_object("layers/dense_2") + + # Add the weights of a new layer + editor.add_object("layers/einsum_dense", weights={"0": ..., "1": ...}) + + # Save the weights of the edited model + editor.resave_weights("edited_model.weights.h5") + ``` + """ + + def __init__( + self, + filepath, + ): + self.filepath = filepath + self.metadata = None + self.config = None + self.model = None + self.console = rich.console.Console(highlight=False) + + if filepath.endswith(".keras"): + zf = zipfile.ZipFile(filepath, "r") + weights_store = H5IOStore( + saving_lib._VARS_FNAME + ".h5", + archive=zf, + mode="r", + ) + with zf.open(saving_lib._CONFIG_FILENAME, "r") as f: + config_json = f.read() + with zf.open(saving_lib._METADATA_FILENAME, "r") as f: + metadata_json = f.read() + self.config = json.loads(config_json) + self.metadata = json.loads(metadata_json) + + elif filepath.endswith(".weights.h5"): + weights_store = H5IOStore(filepath, mode="r") + else: + raise ValueError( + "Invalid filename: " + "expected a `.keras` `.weights.h5` extension. " + f"Received: filepath={filepath}" + ) + + weights_dict, object_metadata = self._extract_weights_from_store( + weights_store.h5_file + ) + weights_store.close() + self.weights_dict = weights_dict + self.object_metadata = object_metadata # {path: object_name} + self.console.print(self._generate_filepath_info(rich_style=True)) + + if self.metadata is not None: + self.console.print(self._generate_metadata_info(rich_style=True)) + + def summary(self): + """Prints the weight structure of the opened file.""" + self._weights_summary_cli() + + def compare(self, reference_model): + """Compares the opened file to a reference model. + + This method will list all mismatches between the + currently opened file and the provided reference model. 
+ + Args: + reference_model: Model instance to compare to. + + Returns: + Dict with the following keys: + `'status'`, `'error_count'`, `'match_count'`. + Status can be `'success'` or `'error'`. + `'error_count'` is the number of mismatches found. + `'match_count'` is the number of matching weights found. + """ + self.console.print("Running comparison") + ref_spec = {} + get_weight_spec_of_saveable(reference_model, ref_spec) + + def _compare( + target, + ref_spec, + inner_path, + target_name, + ref_name, + error_count, + match_count, + checked_paths, + ): + base_inner_path = inner_path + for ref_key, ref_val in ref_spec.items(): + inner_path = base_inner_path + "/" + ref_key + if inner_path in checked_paths: + continue + + if ref_key not in target: + error_count += 1 + checked_paths.add(inner_path) + if isinstance(ref_val, dict): + self.console.print( + f"[color(160)]...Object [bold]{inner_path}[/] " + f"present in {ref_name}, " + f"missing from {target_name}[/]" + ) + self.console.print( + f" In {ref_name}, {inner_path} contains " + f"the following keys: {list(ref_val.keys())}" + ) + else: + self.console.print( + f"[color(160)]...Weight [bold]{inner_path}[/] " + f"present in {ref_name}, " + f"missing from {target_name}[/]" + ) + elif isinstance(ref_val, dict): + _error_count, _match_count = _compare( + target[ref_key], + ref_spec[ref_key], + inner_path, + target_name, + ref_name, + error_count=error_count, + match_count=match_count, + checked_paths=checked_paths, + ) + error_count += _error_count + match_count += _match_count + else: + if target[ref_key].shape != ref_val.shape: + error_count += 1 + checked_paths.add(inner_path) + self.console.print( + f"[color(160)]...Weight shape mismatch " + f"for [bold]{inner_path}[/][/]\n" + f" In {ref_name}: " + f"shape={ref_val.shape}\n" + f" In {target_name}: " + f"shape={target[ref_key].shape}" + ) + else: + match_count += 1 + return error_count, match_count + + checked_paths = set() + error_count, match_count = _compare( + 
self.weights_dict, + ref_spec, + inner_path="", + target_name="saved file", + ref_name="reference model", + error_count=0, + match_count=0, + checked_paths=checked_paths, + ) + _error_count, _ = _compare( + ref_spec, + self.weights_dict, + inner_path="", + target_name="reference model", + ref_name="saved file", + error_count=0, + match_count=0, + checked_paths=checked_paths, + ) + error_count += _error_count + self.console.print("─────────────────────") + if error_count == 0: + status = "success" + self.console.print( + "[color(28)][bold]Comparison successful:[/] " + "saved file is compatible with the reference model[/]" + ) + if match_count == 1: + plural = "" + else: + plural = "s" + self.console.print( + f" Found {match_count} matching weight{plural}" + ) + else: + status = "error" + if error_count == 1: + plural = "" + else: + plural = "s" + self.console.print( + f"[color(160)][bold]Found {error_count} error{plural}:[/] " + "saved file is not compatible with the reference model[/]" + ) + return { + "status": status, + "error_count": error_count, + "match_count": match_count, + } + + def _edit_object(self, edit_fn, source_name, target_name=None): + if target_name is not None and "/" in target_name: + raise ValueError( + "Argument `target_name` should be a leaf name, " + "not a full path name. " + f"Received: target_name='{target_name}'" + ) + if "/" in source_name: + # It's a path + elements = source_name.split("/") + weights_dict = self.weights_dict + for e in elements[:-1]: + if e not in weights_dict: + raise ValueError( + f"Path '{source_name}' not found in model." 
+ ) + weights_dict = weights_dict[e] + if elements[-1] not in weights_dict: + raise ValueError(f"Path '{source_name}' not found in model.") + edit_fn( + weights_dict, source_name=elements[-1], target_name=target_name + ) + else: + # Ensure unicity + def count_occurences(d, name, count=0): + for k in d: + if isinstance(d[k], dict): + count += count_occurences(d[k], name, count) + if name in d: + count += 1 + return count + + occurrences = count_occurences(self.weights_dict, source_name) + if occurrences > 1: + raise ValueError( + f"Name '{source_name}' occurs more than once in the model; " + "try passing a complete path" + ) + if occurrences == 0: + raise ValueError( + f"Source name '{source_name}' does not appear in the " + "model. Use `editor.weights_summary()` " + "to list all objects." + ) + + def _edit(d): + for k in d: + if isinstance(d[k], dict): + _edit(d[k]) + if source_name in d: + edit_fn(d, source_name=source_name, target_name=target_name) + + _edit(self.weights_dict) + + def rename_object(self, object_name, new_name): + """Rename an object in the file (e.g. a layer). + + Args: + object_name: String, name or path of the + object to rename (e.g. `"dense_2"` or + `"layers/dense_2"`). + new_name: String, new name of the object. + """ + + def rename_fn(weights_dict, source_name, target_name): + weights_dict[target_name] = weights_dict[source_name] + weights_dict.pop(source_name) + + self._edit_object(rename_fn, object_name, new_name) + + def delete_object(self, object_name): + """Removes an object from the file (e.g. a layer). + + Args: + object_name: String, name or path of the + object to delete (e.g. `"dense_2"` or + `"layers/dense_2"`). + """ + + def delete_fn(weights_dict, source_name, target_name=None): + weights_dict.pop(source_name) + + self._edit_object(delete_fn, object_name) + + def add_object(self, object_path, weights): + """Add a new object to the file (e.g. a layer). + + Args: + object_path: String, full path of the + object to add (e.g. 
`"layers/dense_2"`). + weights: Dict mapping weight names to weight + values (arrays), + e.g. `{"0": kernel_value, "1": bias_value}`. + """ + if not isinstance(weights, dict): + raise ValueError( + "Argument `weights` should be a dict " + "where keys are weight names (usually '0', '1', etc.) " + "and values are NumPy arrays. " + f"Received: type(weights)={type(weights)}" + ) + + if "/" in object_path: + # It's a path + elements = object_path.split("/") + partial_path = "/".join(elements[:-1]) + weights_dict = self.weights_dict + for e in elements[:-1]: + if e not in weights_dict: + raise ValueError( + f"Path '{partial_path}' not found in model." + ) + weights_dict = weights_dict[e] + weights_dict[elements[-1]] = weights + else: + self.weights_dict[object_path] = weights + + def delete_weight(self, object_name, weight_name): + """Removes a weight from an existing object. + + Args: + object_name: String, name or path of the + object from which to remove the weight + (e.g. `"dense_2"` or `"layers/dense_2"`). + weight_name: String, name of the weight to + delete (e.g. `"0"`). + """ + + def delete_weight_fn(weights_dict, source_name, target_name=None): + if weight_name not in weights_dict[source_name]: + raise ValueError( + f"Weight {weight_name} not found " + f"in object {object_name}. " + "Weights found: " + f"{list(weights_dict[source_name].keys())}" + ) + weights_dict[source_name].pop(weight_name) + + self._edit_object(delete_weight_fn, object_name) + + def add_weights(self, object_name, weights): + """Add one or more new weights to an existing object. + + Args: + object_name: String, name or path of the + object to add the weights to + (e.g. `"dense_2"` or `"layers/dense_2"`). + weights: Dict mapping weight names to weight + values (arrays), + e.g. `{"0": kernel_value, "1": bias_value}`. + """ + if not isinstance(weights, dict): + raise ValueError( + "Argument `weights` should be a dict " + "where keys are weight names (usually '0', '1', etc.) 
" + "and values are NumPy arrays. " + f"Received: type(weights)={type(weights)}" + ) + + def add_weight_fn(weights_dict, source_name, target_name=None): + weights_dict[source_name].update(weights) + + self._edit_object(add_weight_fn, object_name) + + def save(self, filepath): + """Save the edited weights file. + + Args: + filepath: Path to save the file to. + Must be a `.weights.h5` file. + """ + filepath = str(filepath) + if not filepath.endswith(".weights.h5"): + raise ValueError( + "Invalid `filepath` argument: " + "expected a `.weights.h5` extension. " + f"Received: filepath={filepath}" + ) + weights_store = H5IOStore(filepath, mode="w") + + def _save(weights_dict, weights_store, inner_path): + vars_to_create = {} + for name, value in weights_dict.items(): + if isinstance(value, dict): + if value: + _save( + weights_dict[name], + weights_store, + inner_path=inner_path + "/" + name, + ) + else: + # e.g. name="0", value=HDF5Dataset + vars_to_create[name] = value + if vars_to_create: + var_store = weights_store.make(inner_path) + for name, value in vars_to_create.items(): + var_store[name] = value + + _save(self.weights_dict, weights_store, inner_path="") + weights_store.close() + + def resave_weights(self, filepath): + self.save(filepath) + + def _extract_weights_from_store(self, data, metadata=None, inner_path=""): + metadata = metadata or {} + + object_metadata = {} + for k, v in data.attrs.items(): + object_metadata[k] = v + if object_metadata: + metadata[inner_path] = object_metadata + + result = collections.OrderedDict() + for key in data.keys(): + inner_path = inner_path + "/" + key + value = data[key] + if isinstance(value, h5py.Group): + if len(value) == 0: + continue + if "vars" in value.keys() and len(value["vars"]) == 0: + continue + + if hasattr(value, "keys"): + if "vars" in value.keys(): + result[key], metadata = self._extract_weights_from_store( + value["vars"], metadata=metadata, inner_path=inner_path + ) + else: + result[key], metadata = 
self._extract_weights_from_store( + value, metadata=metadata, inner_path=inner_path + ) + else: + result[key] = value[()] + return result, metadata + + def _generate_filepath_info(self, rich_style=False): + if rich_style: + filepath = f"'{self.filepath}'" + filepath = f"{summary_utils.highlight_symbol(filepath)}" + else: + filepath = f"'{self.filepath}'" + return f"Keras model file {filepath}" + + def _generate_config_info(self, rich_style=False): + return pprint.pformat(self.config) + + def _generate_metadata_info(self, rich_style=False): + version = self.metadata["keras_version"] + date = self.metadata["date_saved"] + if rich_style: + version = f"{summary_utils.highlight_symbol(version)}" + date = f"{summary_utils.highlight_symbol(date)}" + return f"Saved with Keras {version} " f"- date: {date}" + + def _print_weights_structure( + self, weights_dict, indent=0, is_first=True, prefix="", inner_path="" + ): + for idx, (key, value) in enumerate(weights_dict.items()): + inner_path = inner_path + "/" + key + is_last = idx == len(weights_dict) - 1 + if is_first: + is_first = False + connector = "> " + elif is_last: + connector = "└─ " + else: + connector = "├─ " + + if isinstance(value, dict): + bold_key = summary_utils.bold_text(key) + object_label = f"{prefix}{connector}{bold_key}" + if inner_path in self.object_metadata: + metadata = self.object_metadata[inner_path] + if "name" in metadata: + name = metadata["name"] + object_label += f" ('{name}')" + self.console.print(object_label) + if is_last: + appended = " " + else: + appended = "│ " + new_prefix = prefix + appended + self._print_weights_structure( + value, + indent + 1, + is_first=is_first, + prefix=new_prefix, + inner_path=inner_path, + ) + else: + if hasattr(value, "shape"): + bold_key = summary_utils.bold_text(key) + self.console.print( + f"{prefix}{connector}{bold_key}:" + + f" shape={value.shape}, dtype={value.dtype}" + ) + else: + self.console.print(f"{prefix}{connector}{key}: {value}") + + def 
_weights_summary_cli(self): + self.console.print("Weights structure") + self._print_weights_structure(self.weights_dict, prefix=" " * 2) + + def _weights_summary_interactive(self): + def _generate_html_weights(dictionary, margin_left=0, font_size=1): + html = "" + for key, value in dictionary.items(): + if isinstance(value, dict) and value: + html += ( + f'
' + + '{key}' + + _generate_html_weights( + value, margin_left + 20, font_size - 1 + ) + + "
" + ) + else: + html += ( + f'
' + + f'' + + f"{key} : shape={value.shape}" + + f", dtype={value.dtype}" + + f"
' + + f"{display_weight(value)}" + + "
" + + "
" + ) + return html + + output = "Weights structure" + + initialize_id_counter() + output += _generate_html_weights(self.weights_dict) + ipython.display.display(ipython.display.HTML(output)) + + +def get_weight_spec_of_saveable(saveable, spec, visited_saveables=None): + from keras.src.saving.keras_saveable import KerasSaveable + + visited_saveables = visited_saveables or set() + + # If the saveable has already been saved, skip it. + if id(saveable) in visited_saveables: + return + + if hasattr(saveable, "save_own_variables"): + store = {} + saveable.save_own_variables(store) + if store: + keys = sorted(store.keys()) + for k in keys: + val = store[k] + spec[k] = backend.KerasTensor(shape=val.shape, dtype=val.dtype) + + visited_saveables.add(id(saveable)) + + for child_attr, child_obj in saving_lib._walk_saveable(saveable): + if isinstance(child_obj, KerasSaveable): + sub_spec = {} + get_weight_spec_of_saveable( + child_obj, + sub_spec, + visited_saveables=visited_saveables, + ) + if sub_spec: + spec[child_attr] = sub_spec + elif isinstance(child_obj, (list, dict, tuple, set)): + sub_spec = {} + get_weight_spec_of_container( + child_obj, + sub_spec, + visited_saveables=visited_saveables, + ) + if sub_spec: + spec[child_attr] = sub_spec + + +def get_weight_spec_of_container(container, spec, visited_saveables): + from keras.src.saving.keras_saveable import KerasSaveable + + used_names = {} + if isinstance(container, dict): + container = list(container.values()) + + for saveable in container: + if isinstance(saveable, KerasSaveable): + name = naming.to_snake_case(saveable.__class__.__name__) + if name in used_names: + used_names[name] += 1 + name = f"{name}_{used_names[name]}" + else: + used_names[name] = 0 + sub_spec = {} + get_weight_spec_of_saveable( + saveable, + sub_spec, + visited_saveables=visited_saveables, + ) + if sub_spec: + spec[name] = sub_spec + + +def initialize_id_counter(): + global div_id_counter + div_id_counter = 0 + + +def increment_id_counter(): + 
global div_id_counter + div_id_counter += 1 + + +def get_id_counter(): + return div_id_counter + + +def display_weight(weight, axis=-1, threshold=16): + def _find_factors_closest_to_sqrt(num): + sqrt_num = int(np.sqrt(num)) + + for i in range(sqrt_num, 0, -1): + if num % i == 0: + M = i + N = num // i + + if M > N: + return N, M + return M, N + + def _color_from_rbg(value): + return f"rgba({value[0]}, {value[1]}, {value[2]}, 1)" + + def _reduce_3d_array_by_mean(arr, n, axis): + if axis == 2: + trimmed_arr = arr[:, :, : arr.shape[2] - (arr.shape[2] % n)] + reshaped = np.reshape( + trimmed_arr, (arr.shape[0], arr.shape[1], -1, n) + ) + mean_values = np.mean(reshaped, axis=3) + + elif axis == 1: + trimmed_arr = arr[:, : arr.shape[1] - (arr.shape[1] % n), :] + reshaped = np.reshape( + trimmed_arr, (arr.shape[0], -1, n, arr.shape[2]) + ) + mean_values = np.mean(reshaped, axis=2) + + elif axis == 0: + trimmed_arr = arr[: arr.shape[0] - (arr.shape[0] % n), :, :] + reshaped = np.reshape( + trimmed_arr, (-1, n, arr.shape[1], arr.shape[2]) + ) + mean_values = np.mean(reshaped, axis=1) + + else: + raise ValueError("Axis must be 0, 1, or 2.") + + return mean_values + + def _create_matrix_html(matrix, subplot_size=840): + rows, cols, num_slices = matrix.shape + + M, N = _find_factors_closest_to_sqrt(num_slices) + + try: + from matplotlib import cm + except ImportError: + cm = None + if cm: + rgb_matrix = cm.jet(matrix) + else: + rgb_matrix = (matrix - np.min(matrix)) / ( + np.max(matrix) - np.min(matrix) + ) + rgb_matrix = np.stack([rgb_matrix, rgb_matrix, rgb_matrix], axis=-1) + rgb_matrix = (rgb_matrix[..., :3] * 255).astype("uint8") + + subplot_html = "" + for i in range(num_slices): + cell_html = "" + for row in rgb_matrix[..., i, :]: + for rgb in row: + color = _color_from_rbg(rgb) + cell_html += ( + f'
' + f"
" + ) + subplot_html += f""" +
+ {cell_html} +
+ """ + + cell_size = subplot_size // (N * cols) + + increment_id_counter() + div_id = get_id_counter() + + html_code = f""" +
+ +
+ {subplot_html} +
+
# NOTE(review): this span of the diff covers the end of
# keras/src/saving/keras_saveable.py and the start of
# keras/src/saving/object_registration.py.
import io


class KerasSaveable:
    """Mixin that makes Keras objects picklable via the Keras saving library."""

    # Note: renaming this function will cause old pickles to be broken.
    # This is probably not a huge deal, as pickle should not be a
    # recommended saving format -- it should only be supported for use
    # with distributed computing frameworks.

    def _obj_type(self):
        # FIX: original message read "subclases" and named the method
        # `obj_type()` although the actual method is `_obj_type()`.
        raise NotImplementedError(
            "KerasSaveable subclasses must provide an "
            "implementation for `_obj_type()`"
        )

    @classmethod
    def _unpickle_model(cls, bytesio):
        """Rebuild a model from an in-memory archive (pickle counterpart)."""
        import keras.src.saving.saving_lib as saving_lib

        # pickle is not safe regardless of what you do.
        return saving_lib._load_model_from_fileobj(
            bytesio, custom_objects=None, compile=True, safe_mode=False
        )

    def __reduce__(self):
        """`__reduce__` customizes the behavior of `pickle.dumps()`.

        The method returns a tuple of two elements: a function, and a list
        of arguments to pass to that function. In this case we just
        leverage the keras saving library: the object is serialized into an
        in-memory H5 archive, and `_unpickle_model` reloads it on the other
        side.
        """
        import keras.src.saving.saving_lib as saving_lib

        buf = io.BytesIO()
        saving_lib._save_model_to_fileobj(self, buf, "h5")
        # `io.BytesIO` instances are themselves picklable, so the buffer
        # can travel inside the pickle payload.
        return (
            self._unpickle_model,
            (buf,),
        )


import inspect

from keras.src.api_export import keras_export
from keras.src.backend.common import global_state

# Live registries: "package>name" key -> object, and object -> key.
GLOBAL_CUSTOM_OBJECTS = {}
GLOBAL_CUSTOM_NAMES = {}


@keras_export(
    [
        "keras.saving.CustomObjectScope",
        "keras.saving.custom_object_scope",
        "keras.utils.CustomObjectScope",
        "keras.utils.custom_object_scope",
    ]
)
class CustomObjectScope:
    """Exposes custom classes/functions to Keras deserialization internals.

    Under a scope `with custom_object_scope(objects_dict)`, Keras methods
    such as `keras.models.load_model()` or
    `keras.models.model_from_config()` will be able to deserialize any
    custom object referenced by a saved config (e.g. a custom layer or
    metric).

    Example:

    Consider a custom regularizer `my_regularizer`:

    ```python
    layer = Dense(3, kernel_regularizer=my_regularizer)
    # Config contains a reference to `my_regularizer`
    config = layer.get_config()
    ...
    # Later:
    with custom_object_scope({'my_regularizer': my_regularizer}):
        layer = Dense.from_config(config)
    ```

    Args:
        custom_objects: Dictionary of `{str: object}` pairs,
            where the `str` key is the object name.
    """

    def __init__(self, custom_objects):
        self.custom_objects = custom_objects or {}
        self.backup = None

    def __enter__(self):
        # Copy the currently-active scope dict so that nested scopes
        # restore the right state on exit.
        self.backup = global_state.get_global_attribute(
            "custom_objects_scope_dict", {}
        ).copy()
        global_state.set_global_attribute(
            "custom_objects_scope_dict", self.custom_objects.copy()
        )
        return self

    def __exit__(self, *args, **kwargs):
        global_state.set_global_attribute(
            "custom_objects_scope_dict", self.backup.copy()
        )


# Alias.
custom_object_scope = CustomObjectScope


@keras_export(
    [
        "keras.saving.get_custom_objects",
        "keras.utils.get_custom_objects",
    ]
)
def get_custom_objects():
    """Retrieves a live reference to the global dictionary of custom objects.

    Custom objects set using `custom_object_scope()` are not added to the
    global dictionary of custom objects, and will not appear in the
    returned dictionary.

    Example:

    ```python
    get_custom_objects().clear()
    get_custom_objects()['MyObject'] = MyObject
    ```

    Returns:
        Global dictionary mapping registered class names to classes.
    """
    return GLOBAL_CUSTOM_OBJECTS


@keras_export(
    [
        "keras.saving.register_keras_serializable",
        "keras.utils.register_keras_serializable",
    ]
)
def register_keras_serializable(package="Custom", name=None):
    """Registers an object with the Keras serialization framework.

    This decorator injects the decorated class or function into the Keras
    custom object dictionary, so that it can be serialized and deserialized
    without needing an entry in the user-provided custom object dict. It
    also injects a function that Keras will call to get the object's
    serializable string key.

    Note that to be serialized and deserialized, classes must implement the
    `get_config()` method. Functions do not have this requirement.

    The object will be registered under the key `'package>name'` where
    `name` defaults to the object name if not passed.

    Example:

    ```python
    # Note that `'my_package'` is used as the `package` argument here, and
    # since the `name` argument is not provided, `'MyDense'` is used as
    # the `name`.
    @register_keras_serializable('my_package')
    class MyDense(keras.layers.Dense):
        pass

    assert get_registered_object('my_package>MyDense') == MyDense
    assert get_registered_name(MyDense) == 'my_package>MyDense'
    ```

    Args:
        package: The package that this class belongs to. This is used for
            the `key` (which is `"package>name"`) to identify the class.
            Note that this is the first argument passed into the decorator.
        name: The name to serialize this class under in this package. If
            not provided or `None`, the class' name will be used (note that
            this is the case when the decorator is used with only one
            argument, which becomes the `package`).

    Returns:
        A decorator that registers the decorated class with the passed
        names.
    """

    def decorator(arg):
        """Registers a class with the Keras serialization framework."""
        class_name = name if name is not None else arg.__name__
        registered_name = package + ">" + class_name

        # Classes must be round-trippable via get_config(); reject early.
        if inspect.isclass(arg) and not hasattr(arg, "get_config"):
            raise ValueError(
                "Cannot register a class that does not have a "
                "get_config() method."
            )

        GLOBAL_CUSTOM_OBJECTS[registered_name] = arg
        GLOBAL_CUSTOM_NAMES[arg] = registered_name

        return arg

    return decorator
@keras_export(
    [
        "keras.saving.get_registered_name",
        "keras.utils.get_registered_name",
    ]
)
def get_registered_name(obj):
    """Returns the name registered to an object within the Keras framework.

    This function is part of the Keras serialization and deserialization
    framework. It maps objects to the string names associated with those
    objects for serialization/deserialization.

    Args:
        obj: The object to look up.

    Returns:
        The name associated with the object, or the default Python name if
        the object is not registered.
    """
    # Unregistered objects fall back to their plain Python name.
    if obj not in GLOBAL_CUSTOM_NAMES:
        return obj.__name__
    return GLOBAL_CUSTOM_NAMES[obj]


@keras_export(
    [
        "keras.saving.get_registered_object",
        "keras.utils.get_registered_object",
    ]
)
def get_registered_object(name, custom_objects=None, module_objects=None):
    """Returns the class associated with `name` if it is registered with Keras.

    This function is part of the Keras serialization and deserialization
    framework. It maps strings to the objects associated with them for
    serialization/deserialization.

    Example:

    ```python
    def from_config(cls, config, custom_objects=None):
        if 'my_custom_object_name' in config:
            config['hidden_cls'] = tf.keras.saving.get_registered_object(
                config['my_custom_object_name'],
                custom_objects=custom_objects)
    ```

    Args:
        name: The name to look up.
        custom_objects: A dictionary of custom objects to look the name up
            in. Generally, custom_objects is provided by the user.
        module_objects: A dictionary of custom objects to look the name up
            in. Generally, module_objects is provided by midlevel library
            implementers.

    Returns:
        An instantiable class associated with `name`, or `None` if no such
        class exists.
    """
    active_scope = global_state.get_global_attribute(
        "custom_objects_scope_dict", {}
    )
    # Lookup precedence: active custom-object scope, global registry,
    # user-provided dict, then module-level dict.
    for registry in (
        active_scope,
        GLOBAL_CUSTOM_OBJECTS,
        custom_objects,
        module_objects,
    ):
        if registry and name in registry:
            return registry[name]
    return None