Commit 4fa10665 — authored and committed by Brandon T. Willard

Rename modules jax_linker to linker and jax_dispatch to dispatch

Parent: c9333bcf
from aesara.link.jax.linker import JAXLinker
import ast
import re
import warnings
from collections import Counter
from functools import reduce, singledispatch
from keyword import iskeyword
from tempfile import NamedTemporaryFile
from textwrap import indent
from types import FunctionType
from warnings import warn
import jax
import jax.numpy as jnp
import jax.scipy as jsp
import numpy as np
from numpy.random import RandomState
from aesara.compile.ops import DeepCopyOp, ViewOp
from aesara.configdefaults import config
from aesara.graph.basic import Constant, Variable
from aesara.graph.fg import FunctionGraph
from aesara.ifelse import IfElse
from aesara.link.utils import map_storage
from aesara.scalar.basic import Cast, Clip, Composite, Identity, ScalarOp, Second
from aesara.scan.op import Scan
from aesara.scan.utils import scan_args as ScanArgs
from aesara.tensor.basic import (
Alloc,
AllocDiag,
AllocEmpty,
ARange,
ExtractDiag,
Eye,
Join,
MakeVector,
Rebroadcast,
ScalarFromTensor,
TensorFromScalar,
)
from aesara.tensor.blas import BatchedDot
from aesara.tensor.elemwise import CAReduce, DimShuffle, Elemwise
from aesara.tensor.extra_ops import (
Bartlett,
CumOp,
DiffOp,
FillDiagonal,
FillDiagonalOffset,
RavelMultiIndex,
RepeatOp,
Unique,
UnravelIndex,
)
from aesara.tensor.math import Dot, MaxAndArgmax
from aesara.tensor.nlinalg import (
SVD,
Det,
Eig,
Eigh,
MatrixInverse,
QRFull,
QRIncomplete,
)
from aesara.tensor.nnet.basic import LogSoftmax, Softmax
from aesara.tensor.nnet.sigm import ScalarSoftplus
from aesara.tensor.random.op import RandomVariable
from aesara.tensor.shape import Reshape, Shape, Shape_i, SpecifyShape
from aesara.tensor.slinalg import Cholesky, Solve
from aesara.tensor.subtensor import (
AdvancedIncSubtensor,
AdvancedIncSubtensor1,
AdvancedSubtensor,
AdvancedSubtensor1,
IncSubtensor,
Subtensor,
indices_from_subtensor,
)
from aesara.tensor.type_other import MakeSlice
# For use with JAX since JAX doesn't support 'str' arguments
# Maps NumPy bit-generator names to integer codes; used by
# `jax_typify_RandomState` below to encode RNG state without strings.
numpy_bit_gens = {"MT19937": 0, "PCG64": 1, "Philox": 2, "SFC64": 3}

# Mirror Aesara's configured float precision in JAX (JAX defaults to 32-bit).
if config.floatX == "float64":
    jax.config.update("jax_enable_x64", True)
else:
    jax.config.update("jax_enable_x64", False)

# XXX: Enabling this will break some shape-based functionality, and severely
# limit the types of graphs that can be converted.
# See https://github.com/google/jax/blob/4d556837cc9003492f674c012689efc3d68fdf5f/design_notes/omnistaging.md
# Older versions < 0.2.0 do not have this flag so we don't need to set it.
try:
    jax.config.disable_omnistaging()
except AttributeError:
    # JAX < 0.2.0: the flag does not exist at all.
    pass
except Exception as e:
    # The version might be >= 0.2.12, which means that omnistaging can't be
    # disabled
    warnings.warn(f"JAX omnistaging couldn't be disabled: {e}")

# Op groups that share a single conversion function (registered further down).
subtensor_ops = (Subtensor, AdvancedSubtensor1, AdvancedSubtensor)
incsubtensor_ops = (IncSubtensor, AdvancedIncSubtensor1)
@singledispatch
def jax_typify(data, dtype):
    """Convert instances of Aesara `Type`s to JAX types.

    When `dtype` is ``None`` the value is returned untouched; otherwise it
    is wrapped in a JAX array of that dtype.
    """
    if dtype is None:
        return data
    return jnp.array(data, dtype=dtype)
@jax_typify.register(np.ndarray)
def jax_typify_ndarray(data, dtype):
    """Convert a NumPy array into a JAX array with the requested dtype."""
    return jnp.array(data, dtype=dtype)
@jax_typify.register(RandomState)
def jax_typify_RandomState(state, dtype):
    # Convert a NumPy `RandomState` into a JAX-compatible state dict.
    # `dtype` is accepted for dispatch uniformity but not used here.
    state = state.get_state(legacy=False)
    # Replace the bit-generator's string name with an integer code, since
    # JAX can't carry string arguments (see `numpy_bit_gens`).
    state["bit_generator"] = numpy_bit_gens[state["bit_generator"]]
    return state
@singledispatch
def jax_funcify(op, **kwargs):
    """Create a JAX compatible function from an Aesara `Op`.

    This is the dispatch base case: reaching it means no conversion has
    been registered for ``type(op)``.
    """
    raise NotImplementedError(f"No JAX conversion for the given `Op`: {op}")
@jax_funcify.register(MakeSlice)
def jax_funcify_MakeSlice(op):
    """Return a function that packs its arguments into a `slice` object."""

    def makeslice(*slice_parts):
        # `slice_parts` are the (start, stop, step) components.
        return slice(*slice_parts)

    return makeslice
@jax_funcify.register(ScalarOp)
def jax_funcify_ScalarOp(op):
    """Map a scalar `Op` to its NumPy-equivalent JAX function via `nfunc_spec`."""
    func_name = op.nfunc_spec[0]

    if "." in func_name:
        # Dotted names (e.g. "scipy.special.foo") are resolved attribute by
        # attribute starting from the `jax` package itself.
        jnp_func = reduce(getattr, [jax] + func_name.split("."))
    else:
        jnp_func = getattr(jnp, func_name)

    if hasattr(op, "nfunc_variadic"):
        # These are special cases that handle invalid arities due to the broken
        # Aesara `Op` type contract (e.g. binary `Op`s that also function as
        # their own variadic counterparts--even when those counterparts already
        # exist as independent `Op`s).
        jax_variadic_func = getattr(jnp, op.nfunc_variadic)

        def elemwise(*args):
            if len(args) > op.nfunc_spec[1]:
                # More arguments than the declared arity: stack the broadcast
                # arguments and reduce them with the variadic function.
                return jax_variadic_func(
                    jnp.stack(jnp.broadcast_arrays(*args), axis=0), axis=0
                )
            else:
                return jnp_func(*args)

        return elemwise
    else:
        return jnp_func
@jax_funcify.register(Clip)
def jax_funcify_Clip(op):
    """Return a JAX implementation of `Clip`.

    The returned function bounds `x` to the closed interval ``[min, max]``.
    """

    def clip(x, min, max):
        # `jnp.clip` is the idiomatic form of the nested-`where` expression
        # this previously open-coded (values below `min` become `min`, values
        # above `max` become `max`; NaNs propagate in both formulations).
        # NOTE: `min`/`max` shadow the builtins, but the parameter names are
        # part of the existing calling convention, so they are kept.
        return jnp.clip(x, min, max)

    return clip
@jax_funcify.register(Identity)
def jax_funcify_Identity(op):
    """Return a pass-through function; `Identity` is a no-op under JAX."""

    def identity(x):
        # Nothing to compute: hand the input straight back.
        return x

    return identity
@jax_funcify.register(Softmax)
def jax_funcify_Softmax(op):
    """Return a JAX implementation of `Softmax`."""

    def softmax(x):
        # Delegate to JAX's built-in softmax.
        return jax.nn.softmax(x)

    return softmax
@jax_funcify.register(LogSoftmax)
def jax_funcify_LogSoftmax(op):
    """Return a JAX implementation of `LogSoftmax`."""

    def log_softmax(x):
        # Delegate to JAX's numerically-stable log-softmax.
        return jax.nn.log_softmax(x)

    return log_softmax
@jax_funcify.register(ScalarSoftplus)
def jax_funcify_ScalarSoftplus(op):
    """Return a JAX implementation of the scalar softplus."""

    def scalarsoftplus(x):
        # Piecewise form used by Aesara: underflow to 0 for very negative
        # inputs, identity for very positive inputs, log1p(exp(x)) otherwise.
        middle = jnp.log1p(jnp.exp(x))
        return jnp.where(x < -30.0, 0.0, jnp.where(x > 30.0, x, middle))

    return scalarsoftplus
@jax_funcify.register(Second)
def jax_funcify_Second(op):
    """Return a function implementing `Second`: `y` broadcast to `x`'s shape."""

    def second(x, y):
        # Only `x`'s shape matters; its values are discarded.
        return jnp.broadcast_to(y, x.shape)

    return second
@jax_funcify.register(AllocDiag)
def jax_funcify_AllocDiag(op):
    """Return a function placing `v` on the `op.offset`-th diagonal."""
    diag_offset = op.offset

    def allocdiag(v, offset=diag_offset):
        return jnp.diag(v, k=offset)

    return allocdiag
@jax_funcify.register(AllocEmpty)
def jax_funcify_AllocEmpty(op):
    """Return a function allocating an array of `op.dtype` with the given shape."""

    def allocempty(*shape):
        # JAX has no truly uninitialized arrays; `jnp.empty` provides the
        # shape/dtype contract `AllocEmpty` requires.
        return jnp.empty(shape, dtype=op.dtype)

    return allocempty
@jax_funcify.register(Alloc)
def jax_funcify_Alloc(op):
    """Return a function that broadcasts `x` to the requested shape."""

    def alloc(x, *shape):
        return jnp.broadcast_to(x, shape)

    return alloc
@jax_funcify.register(Dot)
def jax_funcify_Dot(op):
    """Return a JAX implementation of `Dot` (NumPy dot-product semantics)."""

    def dot(x, y):
        return jnp.dot(x, y)

    return dot
@jax_funcify.register(ARange)
def jax_funcify_ARange(op):
    """Return a JAX implementation of `ARange` with the op's dtype."""

    # XXX: This currently requires concrete arguments.
    def arange(start, stop, step):
        return jnp.arange(start, stop, step, dtype=op.dtype)

    return arange
def jnp_safe_copy(x):
    """Copy `x` via `jnp.copy`, falling back to the object's own ``copy``.

    Some JAX versions raise `NotImplementedError` from `jnp.copy`; in that
    case ``x.copy()`` is used when available, otherwise `x` itself is
    returned (with a warning).
    """
    try:
        return jnp.copy(x)
    except NotImplementedError:
        warn("`jnp.copy` is not implemented yet. " "Using the object's `copy` method.")
        if hasattr(x, "copy"):
            return jnp.array(x.copy())
        warn(f"Object has no `copy` method: {x}")
        return x
@jax_funcify.register(DeepCopyOp)
def jax_funcify_DeepCopyOp(op):
    # JAX arrays are immutable, so a "safe" copy stands in for a deep copy.
    def deepcopyop(x):
        return jnp_safe_copy(x)

    return deepcopyop
@jax_funcify.register(Shape)
def jax_funcify_Shape(op):
    """Return a function that yields its input's full shape."""

    def shape(x):
        return jnp.shape(x)

    return shape
@jax_funcify.register(Shape_i)
def jax_funcify_Shape_i(op):
    """Return a function extracting dimension `op.i` of its input's shape."""
    dim_index = op.i

    def shape_i(x):
        return jnp.shape(x)[dim_index]

    return shape_i
@jax_funcify.register(SpecifyShape)
def jax_funcify_SpecifyShape(op):
    def specifyshape(x, shape):
        # Validate the promised shape, then pass `x` through unchanged.
        # NOTE(review): `assert` is stripped under `python -O`, so these
        # checks silently vanish in optimized runs.
        assert x.ndim == len(shape)
        assert jnp.all(x.shape == tuple(shape)), (
            "got shape",
            x.shape,
            "expected",
            shape,
        )
        return x

    return specifyshape
@jax_funcify.register(Rebroadcast)
def jax_funcify_Rebroadcast(op):
    # Mapping of axis -> broadcastable flag requested by the `Op`.
    op_axis = op.axis

    def rebroadcast(x):
        # Every axis flagged broadcastable must actually have length 1;
        # the data itself is returned unchanged.
        for axis, value in op_axis.items():
            if value and x.shape[axis] != 1:
                raise ValueError(
                    "Dimension %s in Rebroadcast's input was"
                    " supposed to be 1 (got %s instead)" % (axis, x.shape[axis])
                )
        return x

    return rebroadcast
@jax_funcify.register(ViewOp)
def jax_funcify_ViewOp(op):
    """Return a pass-through function; a view needs no work in JAX."""

    def viewop(x):
        return x

    return viewop
@jax_funcify.register(Cast)
def jax_funcify_Cast(op):
    """Return a function casting its input to `op.o_type.dtype`."""

    def cast(x):
        # Wrap in an array first so plain Python scalars can be cast too.
        return jnp.array(x).astype(op.o_type.dtype)

    return cast
@jax_funcify.register(TensorFromScalar)
def jax_funcify_TensorFromScalar(op):
    """Return a function that wraps a scalar into a JAX array."""

    def tensor_from_scalar(x):
        return jnp.array(x)

    return tensor_from_scalar
@jax_funcify.register(ScalarFromTensor)
def jax_funcify_ScalarFromTensor(op):
    """Return a function extracting the single scalar held by a tensor."""

    def scalar_from_tensor(x):
        # Flatten and take the first (only) element.
        return jnp.array(x).flatten()[0]

    return scalar_from_tensor
@jax_funcify.register(Elemwise)
def jax_funcify_Elemwise(op):
    # JAX/NumPy functions broadcast on their own, so converting an
    # `Elemwise` reduces to converting its underlying scalar `Op`.
    scalar_op = op.scalar_op
    return jax_funcify(scalar_op)
@jax_funcify.register(Composite)
def jax_funcify_Composite(op):
    # This approach basically gets rid of the fused `Elemwise` by turning each
    # `Op` in the `Composite` back into individually broadcasted NumPy-like
    # operations.
    # TODO: A better approach would involve something like `jax.vmap` or some
    # other operation that can perform the broadcasting that `Elemwise` does.
    jax_impl = jax_funcify(op.fgraph)

    def composite(*args):
        # The compiled graph returns a tuple; a `Composite` has one output.
        return jax_impl(*args)[0]

    return composite
@jax_funcify.register(Scan)
def jax_funcify_Scan(op):
    """Convert an Aesara `Scan` loop into a `jax.lax.scan` call.

    The inner graph is funcified once up front; the returned `scan`
    function then adapts the outer `Scan` calling convention to JAX's
    ``(carry, x) -> (carry, y)`` protocol.
    """
    inner_fg = FunctionGraph(op.inputs, op.outputs)
    # NOTE(review): this value is iterated below (`for fn in ...`), but
    # `jax_funcify_FunctionGraph` returns a single callable — confirm which
    # contract is intended here.
    jax_aet_inner_func = jax_funcify(inner_fg)

    def scan(*outer_inputs):
        scan_args = ScanArgs(
            list(outer_inputs), [None] * op.n_outs, op.inputs, op.outputs, op.info
        )

        # `outer_inputs` is a list with the following composite form:
        # [n_steps]
        # + outer_in_seqs
        # + outer_in_mit_mot
        # + outer_in_mit_sot
        # + outer_in_sit_sot
        # + outer_in_shared
        # + outer_in_nit_sot
        # + outer_in_non_seqs
        n_steps = scan_args.n_steps
        seqs = scan_args.outer_in_seqs

        # TODO: mit_mots
        mit_mot_in_slices = []

        # Initial tap window for each mit-sot output: the first
        # `max_neg + max_pos` entries of the corresponding outer input.
        mit_sot_in_slices = []
        for tap, seq in zip(scan_args.mit_sot_in_slices, scan_args.outer_in_mit_sot):
            neg_taps = [abs(t) for t in tap if t < 0]
            pos_taps = [abs(t) for t in tap if t > 0]
            max_neg = max(neg_taps) if neg_taps else 0
            max_pos = max(pos_taps) if pos_taps else 0
            init_slice = seq[: max_neg + max_pos]
            mit_sot_in_slices.append(init_slice)

        sit_sot_in_slices = [seq[0] for seq in scan_args.outer_in_sit_sot]

        init_carry = (
            mit_mot_in_slices,
            mit_sot_in_slices,
            sit_sot_in_slices,
            scan_args.outer_in_shared,
            scan_args.outer_in_non_seqs,
        )

        def jax_args_to_inner_scan(op, carry, x):
            # `carry` contains all inner-output taps, non_seqs, and shared
            # terms
            (
                inner_in_mit_mot,
                inner_in_mit_sot,
                inner_in_sit_sot,
                inner_in_shared,
                inner_in_non_seqs,
            ) = carry

            # `x` contains the in_seqs
            inner_in_seqs = x

            # `inner_scan_inputs` is a list with the following composite form:
            # inner_in_seqs
            # + sum(inner_in_mit_mot, [])
            # + sum(inner_in_mit_sot, [])
            # + inner_in_sit_sot
            # + inner_in_shared
            # + inner_in_non_seqs
            inner_in_mit_sot_flatten = []
            for array, index in zip(inner_in_mit_sot, scan_args.mit_sot_in_slices):
                inner_in_mit_sot_flatten.extend(array[jnp.array(index)])

            inner_scan_inputs = sum(
                [
                    inner_in_seqs,
                    inner_in_mit_mot,
                    inner_in_mit_sot_flatten,
                    inner_in_sit_sot,
                    inner_in_shared,
                    inner_in_non_seqs,
                ],
                [],
            )

            return inner_scan_inputs

        def inner_scan_outs_to_jax_outs(
            op,
            old_carry,
            inner_scan_outs,
        ):
            (
                inner_in_mit_mot,
                inner_in_mit_sot,
                inner_in_sit_sot,
                inner_in_shared,
                inner_in_non_seqs,
            ) = old_carry

            def update_mit_sot(mit_sot, new_val):
                # Shift the tap window forward by one step.
                return jnp.concatenate([mit_sot[1:], new_val[None, ...]], axis=0)

            inner_out_mit_sot = [
                update_mit_sot(mit_sot, new_val)
                for mit_sot, new_val in zip(inner_in_mit_sot, inner_scan_outs)
            ]

            # This should contain all inner-output taps, non_seqs, and shared
            # terms
            if not inner_in_sit_sot:
                inner_out_sit_sot = []
            else:
                inner_out_sit_sot = inner_scan_outs

            new_carry = (
                inner_in_mit_mot,
                inner_out_mit_sot,
                inner_out_sit_sot,
                inner_in_shared,
                inner_in_non_seqs,
            )

            return new_carry

        def jax_inner_func(carry, x):
            inner_args = jax_args_to_inner_scan(op, carry, x)
            inner_scan_outs = [fn(*inner_args) for fn in jax_aet_inner_func]
            new_carry = inner_scan_outs_to_jax_outs(op, carry, inner_scan_outs)
            return new_carry, inner_scan_outs

        _, scan_out = jax.lax.scan(jax_inner_func, init_carry, seqs, length=n_steps)

        # We need to prepend the initial values so that the JAX output will
        # match the raw `Scan` `Op` output and, thus, work with a downstream
        # `Subtensor` `Op` introduced by the `scan` helper function.
        def append_scan_out(scan_in_part, scan_out_part):
            return jnp.concatenate([scan_in_part[:-n_steps], scan_out_part], axis=0)

        # NOTE(review): if the `Scan` has neither mit-sot nor sit-sot outputs,
        # `scan_out_final` is never bound and `len(scan_out_final)` below
        # raises `NameError` — presumably such graphs never reach this point;
        # verify.
        if scan_args.outer_in_mit_sot:
            scan_out_final = [
                append_scan_out(init, out)
                for init, out in zip(scan_args.outer_in_mit_sot, scan_out)
            ]
        elif scan_args.outer_in_sit_sot:
            scan_out_final = [
                append_scan_out(init, out)
                for init, out in zip(scan_args.outer_in_sit_sot, scan_out)
            ]

        if len(scan_out_final) == 1:
            scan_out_final = scan_out_final[0]

        return scan_out_final

    return scan
@jax_funcify.register(IfElse)
def jax_funcify_IfElse(op):
    # Number of outputs produced by each branch.
    n_outs = op.n_outs

    def ifelse(cond, *args, n_outs=n_outs):
        # `args` holds both branches back to back: the first `n_outs`
        # values are the "true" outputs, the rest the "false" outputs.
        res = jax.lax.cond(
            cond, lambda _: args[:n_outs], lambda _: args[n_outs:], operand=None
        )
        # Single-output ops unwrap the 1-tuple.
        return res if n_outs > 1 else res[0]

    return ifelse
@jax_funcify.register(Subtensor)
def jax_funcify_Subtensor(op):
    # Static index template; dynamic entries are filled in from `ilists`.
    idx_list = getattr(op, "idx_list", None)

    def subtensor(x, *ilists):
        indices = indices_from_subtensor(ilists, idx_list)

        if len(indices) == 1:
            # A single index is applied directly rather than as a 1-tuple.
            indices = indices[0]

        return x.__getitem__(indices)

    return subtensor


# The same conversion serves all the basic/advanced subtensor variants.
_ = [jax_funcify.register(op, jax_funcify_Subtensor) for op in subtensor_ops]
def jax_funcify_IncSubtensor(op):
    # Shared conversion for the `IncSubtensor`-like `Op`s registered below.
    idx_list = getattr(op, "idx_list", None)

    if getattr(op, "set_instead_of_inc", False):
        # NOTE(review): `jax.ops.index_update`/`index_add` were removed from
        # newer JAX releases; this presumably targets an older JAX — verify
        # against the pinned version.
        jax_fn = jax.ops.index_update
    else:
        jax_fn = jax.ops.index_add

    def incsubtensor(x, y, *ilist, jax_fn=jax_fn, idx_list=idx_list):
        indices = indices_from_subtensor(ilist, idx_list)

        if len(indices) == 1:
            indices = indices[0]

        return jax_fn(x, indices, y)

    return incsubtensor


_ = [jax_funcify.register(op, jax_funcify_IncSubtensor) for op in incsubtensor_ops]
@jax_funcify.register(AdvancedIncSubtensor)
def jax_funcify_AdvancedIncSubtensor(op):
    if getattr(op, "set_instead_of_inc", False):
        # NOTE(review): `jax.ops.index_update`/`index_add` were removed from
        # newer JAX releases — verify against the pinned version.
        jax_fn = jax.ops.index_update
    else:
        jax_fn = jax.ops.index_add

    def advancedincsubtensor(x, y, *ilist, jax_fn=jax_fn):
        # Advanced indices are passed through verbatim as a tuple.
        return jax_fn(x, ilist, y)

    return advancedincsubtensor
@jax_funcify.register(FunctionGraph)
def jax_funcify_FunctionGraph(
    fgraph, order=None, input_storage=None, output_storage=None, storage_map=None
):
    """Compile a whole `FunctionGraph` into one Python/JAX function.

    Source code applying each node's JAX implementation in topological
    order is generated, `exec`ed, and the resulting function returned.
    The generated function always returns a tuple of outputs.
    """
    if order is None:
        order = fgraph.toposort()

    input_storage, output_storage, storage_map = map_storage(
        fgraph, order, input_storage, output_storage, storage_map
    )

    # Globals for the generated module: node functions and constant values.
    global_env = {}

    fgraph_name = "jax_funcified_fgraph"

    def unique_name(x, names_counter=Counter([fgraph_name]), obj_to_names={}):
        # Produce a stable, unique, valid Python identifier for `x`.
        # NOTE: the mutable default arguments are intentional per-call caches
        # (one set per `jax_funcify_FunctionGraph` invocation).
        if x in obj_to_names:
            return obj_to_names[x]

        if isinstance(x, Variable):
            name = re.sub("[^0-9a-zA-Z]+", "_", x.name) if x.name else ""
            name = (
                name if (name.isidentifier() and not iskeyword(name)) else x.auto_name
            )
        elif isinstance(x, FunctionType):
            name = x.__name__
        else:
            name = type(x).__name__

        name_suffix = names_counter.get(name, "")
        local_name = f"{name}{name_suffix}"
        names_counter.update((name,))
        obj_to_names[x] = local_name

        return local_name

    body_assigns = []
    for node in order:
        jax_func = jax_funcify(node.op)

        # Create a local alias with a unique name
        local_jax_func_name = unique_name(jax_func)
        global_env[local_jax_func_name] = jax_func

        node_input_names = []
        for i in node.inputs:
            local_input_name = unique_name(i)
            if storage_map[i][0] is not None or isinstance(i, Constant):
                # Constants need to be assigned locally and referenced
                global_env[local_input_name] = jax_typify(storage_map[i][0], None)
                # TODO: We could attempt to use the storage arrays directly
                # E.g. `local_input_name = f"{local_input_name}[0]"`
            node_input_names.append(local_input_name)

        node_output_names = [unique_name(v) for v in node.outputs]

        body_assigns.append(
            f"{', '.join(node_output_names)} = {local_jax_func_name}({', '.join(node_input_names)})"
        )

    fgraph_input_names = [unique_name(v) for v in fgraph.inputs]
    fgraph_output_names = [unique_name(v) for v in fgraph.outputs]
    joined_body_assigns = indent("\n".join(body_assigns), "    ")

    if len(fgraph_output_names) == 1:
        # Keep the single-output case a tuple so callers can always index.
        fgraph_return_src = f"({fgraph_output_names[0]},)"
    else:
        fgraph_return_src = ", ".join(fgraph_output_names)

    fgraph_def_src = f"""
def {fgraph_name}({", ".join(fgraph_input_names)}):
{joined_body_assigns}
    return {fgraph_return_src}
    """

    fgraph_def_ast = ast.parse(fgraph_def_src)

    # Create source code to be (at least temporarily) associated with the
    # compiled function (e.g. for easier debugging)
    # NOTE(review): `delete=False` leaks one temp file per compiled graph.
    with NamedTemporaryFile(delete=False) as f:
        filename = f.name
        f.write(fgraph_def_src.encode())

    mod_code = compile(fgraph_def_ast, filename, mode="exec")
    exec(mod_code, global_env, locals())

    fgraph_def = locals()[fgraph_name]

    return fgraph_def
@jax_funcify.register(CAReduce)
def jax_funcify_CAReduce(op):
    """Return a JAX implementation of a `CAReduce` (commutative reduction).

    Prefers the NumPy-equivalent reduction named by ``op.nfunc_spec``;
    otherwise falls back to `jax.lax.reduce` driven by the scalar op's
    name and identity element.
    """
    axis = op.axis
    op_nfunc_spec = getattr(op, "nfunc_spec", None)
    scalar_nfunc_spec = getattr(op.scalar_op, "nfunc_spec", None)
    scalar_op_name = getattr(op.scalar_op, "name", None)
    scalar_op_identity = getattr(op.scalar_op, "identity", None)
    acc_dtype = getattr(op, "acc_dtype", None)

    def careduce(x):
        nonlocal axis, op_nfunc_spec, scalar_nfunc_spec, scalar_op_name, scalar_op_identity, acc_dtype

        if axis is None:
            axis = list(range(x.ndim))

        if acc_dtype is None:
            acc_dtype = x.dtype.type

        if op_nfunc_spec:
            jax_op = getattr(jnp, op_nfunc_spec[0])
            return jax_op(x, axis=axis).astype(acc_dtype)

        # The Aesara `Op` didn't tell us which NumPy equivalent to use (or
        # there isn't one), so we use this fallback approach
        if scalar_nfunc_spec:
            scalar_fn_name = scalar_nfunc_spec[0]
        elif scalar_op_name:
            scalar_fn_name = scalar_op_name

        # BUG FIX: this previously used `reversed(sorted(axis))`, an iterator
        # that is always truthy (even for an empty `axis`) and can only be
        # consumed once. Materialize the descending-sorted list instead so the
        # emptiness check and `jax.lax.reduce` both see the actual axes.
        to_reduce = sorted(axis, reverse=True)

        if to_reduce:
            # In this case, we need to use the `jax.lax` function (if there
            # is one), and not the `jnp` version.
            jax_op = getattr(jax.lax, scalar_fn_name)
            init_value = jnp.array(scalar_op_identity, dtype=acc_dtype)
            return jax.lax.reduce(x, init_value, jax_op, to_reduce).astype(acc_dtype)
        else:
            # Nothing to reduce over.
            return x

    return careduce
@jax_funcify.register(MakeVector)
def jax_funcify_MakeVector(op):
    """Return a function packing its scalar arguments into a vector."""

    def makevector(*elements):
        return jnp.array(elements, dtype=op.dtype)

    return makevector
@jax_funcify.register(Reshape)
def jax_funcify_Reshape(op):
    """Return a JAX implementation of `Reshape`."""

    def reshape(x, shape):
        return jnp.reshape(x, shape)

    return reshape
@jax_funcify.register(DimShuffle)
def jax_funcify_DimShuffle(op):
    def dimshuffle(x):
        # 1) Move the kept and dropped dimensions into position.
        res = jnp.transpose(x, op.shuffle + op.drop)

        # 2) Insert the broadcastable (length-1) dimensions.
        shape = list(res.shape[: len(op.shuffle)])

        for augm in op.augment:
            shape.insert(augm, 1)

        res = jnp.reshape(res, shape)

        # 3) Copy unless the `Op` was marked in-place.
        if not op.inplace:
            res = jnp_safe_copy(res)

        return res

    return dimshuffle
@jax_funcify.register(Join)
def jax_funcify_Join(op):
    def join(axis, *tensors):
        # tensors could also be tuples, and in this case they don't have a ndim
        tensors = [jnp.asarray(tensor) for tensor in tensors]
        view = op.view
        if (view != -1) and all(
            [
                tensor.shape[axis] == 0
                for tensor in tensors[0:view] + tensors[view + 1 :]
            ]
        ):
            # Every other input is empty along `axis`: the join is just the
            # `view` input itself.
            return tensors[view]
        else:
            ndim = tensors[0].ndim
            if axis < -ndim:
                # NOTE(review): only the lower bound is checked here, and the
                # "[0, ndim)" range in the message doesn't match the
                # condition — confirm intended bounds handling.
                raise IndexError(
                    f"Join axis {int(axis)} out of bounds [0, {int(ndim)})"
                )

            return jnp.concatenate(tensors, axis=axis)

    return join
@jax_funcify.register(MaxAndArgmax)
def jax_funcify_MaxAndArgmax(op):
    axis = op.axis

    def maxandargmax(x, axis=axis):
        # Normalize `axis` to a concrete tuple of ints.
        if axis is None:
            axes = tuple(range(x.ndim))
        else:
            axes = tuple(int(ax) for ax in axis)

        max_res = jnp.max(x, axis)

        # NumPy does not support multiple axes for argmax; this is a
        # work-around
        keep_axes = jnp.array(
            [i for i in range(x.ndim) if i not in axes], dtype="int64"
        )
        # Not-reduced axes in front
        transposed_x = jnp.transpose(
            x, jnp.concatenate((keep_axes, jnp.array(axes, dtype="int64")))
        )
        kept_shape = transposed_x.shape[: len(keep_axes)]
        reduced_shape = transposed_x.shape[len(keep_axes) :]

        # Numpy.prod returns 1.0 when arg is empty, so we cast it to int64
        # Otherwise reshape would complain citing float arg
        new_shape = kept_shape + (
            jnp.prod(jnp.array(reduced_shape, dtype="int64"), dtype="int64"),
        )
        reshaped_x = transposed_x.reshape(new_shape)

        # Argmax over the single collapsed trailing axis.
        max_idx_res = jnp.argmax(reshaped_x, axis=-1).astype("int64")

        return max_res, max_idx_res

    return maxandargmax
@jax_funcify.register(ExtractDiag)
def jax_funcify_ExtractDiag(op):
    """Return a function extracting the diagonal configured on the `Op`."""
    diag_offset = op.offset
    first_axis = op.axis1
    second_axis = op.axis2

    def extract_diag(x, offset=diag_offset, axis1=first_axis, axis2=second_axis):
        return jnp.diagonal(x, offset=offset, axis1=axis1, axis2=axis2)

    return extract_diag
@jax_funcify.register(Cholesky)
def jax_funcify_Cholesky(op):
    """Return a JAX implementation of the Cholesky factorization."""
    use_lower = op.lower

    def cholesky(a, lower=use_lower):
        # Cast back to the input dtype, matching Aesara's output contract.
        return jsp.linalg.cholesky(a, lower=lower).astype(a.dtype)

    return cholesky
@jax_funcify.register(Solve)
def jax_funcify_Solve(op):
    """Return a JAX implementation of `Solve` (linear system solver)."""
    # Only the lower-triangular structure is forwarded to JAX; any other
    # structure uses the general solver path.
    lower = op.A_structure == "lower_triangular"

    def solve(a, b, lower=lower):
        return jsp.linalg.solve(a, b, lower=lower)

    return solve
@jax_funcify.register(Det)
def jax_funcify_Det(op):
    """Return a function computing the matrix determinant."""

    def det(x):
        return jnp.linalg.det(x)

    return det
@jax_funcify.register(Eig)
def jax_funcify_Eig(op):
    """Return a function computing the (general) eigendecomposition."""

    def eig(x):
        return jnp.linalg.eig(x)

    return eig
@jax_funcify.register(Eigh)
def jax_funcify_Eigh(op):
    """Return a function computing the Hermitian eigendecomposition."""
    triangle = op.UPLO

    def eigh(x, uplo=triangle):
        return jnp.linalg.eigh(x, UPLO=uplo)

    return eigh
@jax_funcify.register(MatrixInverse)
def jax_funcify_MatrixInverse(op):
    """Return a function computing the matrix inverse."""

    def matrix_inverse(x):
        return jnp.linalg.inv(x)

    return matrix_inverse
@jax_funcify.register(QRFull)
def jax_funcify_QRFull(op):
    """Return a function computing the QR decomposition in `op.mode`."""
    qr_mode = op.mode

    def qr_full(x, mode=qr_mode):
        return jnp.linalg.qr(x, mode=mode)

    return qr_full
@jax_funcify.register(QRIncomplete)
def jax_funcify_QRIncomplete(op):
    """Return a function computing the reduced QR decomposition in `op.mode`."""
    qr_mode = op.mode

    def qr_incomplete(x, mode=qr_mode):
        return jnp.linalg.qr(x, mode=mode)

    return qr_incomplete
@jax_funcify.register(SVD)
def jax_funcify_SVD(op):
    """Return a function computing the singular value decomposition."""
    want_full = op.full_matrices
    want_uv = op.compute_uv

    def svd(x, full_matrices=want_full, compute_uv=want_uv):
        return jnp.linalg.svd(x, full_matrices=full_matrices, compute_uv=compute_uv)

    return svd
@jax_funcify.register(CumOp)
def jax_funcify_CumOp(op):
    """Return a cumulative sum or product, depending on `op.mode`."""
    cum_axis = op.axis
    cum_mode = op.mode

    def cumop(x, axis=cum_axis, mode=cum_mode):
        # "add" selects cumsum; any other mode falls through to cumprod.
        if mode == "add":
            return jnp.cumsum(x, axis=axis)
        return jnp.cumprod(x, axis=axis)

    return cumop
@jax_funcify.register(DiffOp)
def jax_funcify_DiffOp(op):
    """Return a function computing the `n`-th discrete difference."""
    diff_order = op.n
    diff_axis = op.axis

    def diffop(x, n=diff_order, axis=diff_axis):
        return jnp.diff(x, n=n, axis=axis)

    return diffop
@jax_funcify.register(RepeatOp)
def jax_funcify_RepeatOp(op):
    """Return a function repeating elements along `op.axis`."""
    repeat_axis = op.axis

    def repeatop(x, repeats, axis=repeat_axis):
        return jnp.repeat(x, repeats, axis=axis)

    return repeatop
@jax_funcify.register(Bartlett)
def jax_funcify_Bartlett(op):
    """Return a function producing a Bartlett window of the given length."""

    def bartlett(x):
        return jnp.bartlett(x)

    return bartlett
@jax_funcify.register(FillDiagonal)
def jax_funcify_FillDiagonal(op):
    """`FillDiagonal` has no JAX conversion.

    The NumPy implementation assigns through `ndarray.flat`, and JAX
    arrays are immutable with no `flatiter` support, so conversion fails
    eagerly here rather than mid-trace. (A dead commented-out draft of a
    NumPy-style implementation was removed.)
    """
    raise NotImplementedError("flatiter not implemented in JAX")
@jax_funcify.register(FillDiagonalOffset)
def jax_funcify_FillDiagonalOffset(op):
    """`FillDiagonalOffset` has no JAX conversion.

    Like `FillDiagonal`, the NumPy implementation assigns through
    `ndarray.flat`, which JAX's immutable arrays cannot support, so
    conversion fails eagerly here. (A dead commented-out draft of a
    NumPy-style implementation was removed.)
    """
    raise NotImplementedError("flatiter not implemented in JAX")
@jax_funcify.register(Unique)
def jax_funcify_Unique(op):
    axis = op.axis

    if axis is not None:
        # Fail at conversion time rather than inside a JAX trace.
        raise NotImplementedError(
            "jax.numpy.unique is not implemented for the axis argument"
        )

    return_index = op.return_index
    return_inverse = op.return_inverse
    return_counts = op.return_counts

    def unique(
        x,
        return_index=return_index,
        return_inverse=return_inverse,
        return_counts=return_counts,
        axis=axis,
    ):
        # NOTE(review): `_unique1d` is a private `jax.numpy` helper and may
        # not exist in newer JAX versions — verify against the pinned JAX.
        ret = jnp.lax_numpy._unique1d(x, return_index, return_inverse, return_counts)

        # With no extra outputs requested, unwrap the 1-tuple.
        if len(ret) == 1:
            return ret[0]
        else:
            return ret

    return unique
@jax_funcify.register(UnravelIndex)
def jax_funcify_UnravelIndex(op):
    """Return a JAX implementation of `UnravelIndex` (order is ignored)."""
    index_order = op.order
    # Emit the warning once, at conversion time.
    warn("JAX ignores the `order` parameter in `unravel_index`.")

    def unravelindex(indices, dims, order=index_order):
        return jnp.unravel_index(indices, dims)

    return unravelindex
@jax_funcify.register(RavelMultiIndex)
def jax_funcify_RavelMultiIndex(op):
    """Return a JAX implementation of `RavelMultiIndex`."""
    clip_mode = op.mode
    index_order = op.order

    def ravelmultiindex(*inp, mode=clip_mode, order=index_order):
        # The last argument carries the target shape; the rest are indices.
        multi_index, dims = inp[:-1], inp[-1]
        return jnp.ravel_multi_index(multi_index, dims, mode=mode, order=order)

    return ravelmultiindex
@jax_funcify.register(Eye)
def jax_funcify_Eye(op):
    """Return a function building an identity-like matrix of `op.dtype`."""
    out_dtype = op.dtype

    def eye(N, M, k):
        return jnp.eye(N, M, k, dtype=out_dtype)

    return eye
@jax_funcify.register(BatchedDot)
def jax_funcify_BatchedDot(op):
    def batched_dot(a, b):
        # The leading (batch) dimensions must agree.
        if a.shape[0] != b.shape[0]:
            raise TypeError("Shapes must match in the 0-th dimension")

        if a.ndim == 2 or b.ndim == 2:
            # One operand is a batch of vectors: contract its single
            # non-batch axis.
            return jnp.einsum("n...j,nj...->n...", a, b)

        # Batched matrix-matrix product.
        return jnp.einsum("nij,njk->nik", a, b)

    return batched_dot
@jax_funcify.register(RandomVariable)
def jax_funcify_RandomVariable(op):
    name = op.name

    # Only distributions that exist under `jax.random` are supported.
    if not hasattr(jax.random, name):
        raise NotImplementedError(
            f"No JAX conversion for the given distribution: {name}"
        )

    def random_variable(rng, size, dtype, *args):
        # Seed a JAX PRNG from the first word of the stored key state.
        prng = jax.random.PRNGKey(rng["state"]["key"][0])
        dtype = jnp.dtype(dtype)
        # NOTE(review): the distribution parameters in `*args` are not
        # forwarded to the sampler — only `key` and `shape` are used; verify.
        data = getattr(jax.random, name)(key=prng, shape=size)
        smpl_value = jnp.array(data, dtype=dtype)
        # Advance the key for the next draw.
        prng = jax.random.split(prng, num=1)[0]
        # NOTE(review): relies on the deprecated `jax.ops.index_update`, and
        # the updated array it returns is discarded — confirm the intended
        # state update.
        jax.ops.index_update(rng["state"]["key"], 0, prng[0])
        return (rng, smpl_value)

    return random_variable
import ast
import re
import warnings
from collections import Counter
from functools import reduce, singledispatch
from keyword import iskeyword
from tempfile import NamedTemporaryFile
from textwrap import indent
from types import FunctionType
from warnings import warn
import jax
import jax.numpy as jnp
import jax.scipy as jsp
import numpy as np
from numpy.random import RandomState
from aesara.compile.ops import DeepCopyOp, ViewOp
from aesara.configdefaults import config
from aesara.graph.basic import Constant, Variable
from aesara.graph.fg import FunctionGraph
from aesara.ifelse import IfElse

warnings.warn(
    "The module `aesara.link.jax.jax_dispatch` is deprecated "
    "and has been renamed to `aesara.link.jax.dispatch`",
    DeprecationWarning,
    stacklevel=2,
)
from aesara.link.utils import map_storage
from aesara.scalar.basic import Cast, Clip, Composite, Identity, ScalarOp, Second
from aesara.scan.op import Scan
from aesara.scan.utils import scan_args as ScanArgs
from aesara.tensor.basic import (
Alloc,
AllocDiag,
AllocEmpty,
ARange,
ExtractDiag,
Eye,
Join,
MakeVector,
Rebroadcast,
ScalarFromTensor,
TensorFromScalar,
)
from aesara.tensor.blas import BatchedDot
from aesara.tensor.elemwise import CAReduce, DimShuffle, Elemwise
from aesara.tensor.extra_ops import (
Bartlett,
CumOp,
DiffOp,
FillDiagonal,
FillDiagonalOffset,
RavelMultiIndex,
RepeatOp,
Unique,
UnravelIndex,
)
from aesara.tensor.math import Dot, MaxAndArgmax
from aesara.tensor.nlinalg import (
SVD,
Det,
Eig,
Eigh,
MatrixInverse,
QRFull,
QRIncomplete,
)
from aesara.tensor.nnet.basic import LogSoftmax, Softmax
from aesara.tensor.nnet.sigm import ScalarSoftplus
from aesara.tensor.random.op import RandomVariable
from aesara.tensor.shape import Reshape, Shape, Shape_i, SpecifyShape
from aesara.tensor.slinalg import Cholesky, Solve
from aesara.tensor.subtensor import (
AdvancedIncSubtensor,
AdvancedIncSubtensor1,
AdvancedSubtensor,
AdvancedSubtensor1,
IncSubtensor,
Subtensor,
indices_from_subtensor,
)
from aesara.tensor.type_other import MakeSlice
# For use with JAX since JAX doesn't support 'str' arguments
numpy_bit_gens = {"MT19937": 0, "PCG64": 1, "Philox": 2, "SFC64": 3}
if config.floatX == "float64":
jax.config.update("jax_enable_x64", True)
else:
jax.config.update("jax_enable_x64", False)
# XXX: Enabling this will break some shape-based functionality, and severely
# limit the types of graphs that can be converted.
# See https://github.com/google/jax/blob/4d556837cc9003492f674c012689efc3d68fdf5f/design_notes/omnistaging.md
# Older versions < 0.2.0 do not have this flag so we don't need to set it.
try:
jax.config.disable_omnistaging()
except AttributeError:
pass
except Exception as e:
# The version might be >= 0.2.12, which means that omnistaging can't be
# disabled
warnings.warn(f"JAX omnistaging couldn't be disabled: {e}")
subtensor_ops = (Subtensor, AdvancedSubtensor1, AdvancedSubtensor)
incsubtensor_ops = (IncSubtensor, AdvancedIncSubtensor1)
@singledispatch
def jax_typify(data, dtype):
"""Convert instances of Aesara `Type`s to JAX types."""
if dtype is None:
return data
else:
return jnp.array(data, dtype=dtype)
@jax_typify.register(np.ndarray)
def jax_typify_ndarray(data, dtype):
return jnp.array(data, dtype=dtype)
@jax_typify.register(RandomState)
def jax_typify_RandomState(state, dtype):
state = state.get_state(legacy=False)
state["bit_generator"] = numpy_bit_gens[state["bit_generator"]]
return state
@singledispatch
def jax_funcify(op, **kwargs):
"""Create a JAX compatible function from an Aesara `Op`."""
raise NotImplementedError(f"No JAX conversion for the given `Op`: {op}")
@jax_funcify.register(MakeSlice)
def jax_funcify_MakeSlice(op):
def makeslice(*x):
return slice(*x)
return makeslice
@jax_funcify.register(ScalarOp)
def jax_funcify_ScalarOp(op):
func_name = op.nfunc_spec[0]
if "." in func_name:
jnp_func = reduce(getattr, [jax] + func_name.split("."))
else:
jnp_func = getattr(jnp, func_name)
if hasattr(op, "nfunc_variadic"):
# These are special cases that handle invalid arities due to the broken
# Aesara `Op` type contract (e.g. binary `Op`s that also function as
# their own variadic counterparts--even when those counterparts already
# exist as independent `Op`s).
jax_variadic_func = getattr(jnp, op.nfunc_variadic)
def elemwise(*args):
if len(args) > op.nfunc_spec[1]:
return jax_variadic_func(
jnp.stack(jnp.broadcast_arrays(*args), axis=0), axis=0
)
else:
return jnp_func(*args)
return elemwise
else:
return jnp_func
@jax_funcify.register(Clip)
def jax_funcify_Clip(op):
def clip(x, min, max):
return jnp.where(x < min, min, jnp.where(x > max, max, x))
return clip
@jax_funcify.register(Identity)
def jax_funcify_Identity(op):
def identity(x):
return x
return identity
@jax_funcify.register(Softmax)
def jax_funcify_Softmax(op):
def softmax(x):
return jax.nn.softmax(x)
return softmax
@jax_funcify.register(LogSoftmax)
def jax_funcify_LogSoftmax(op):
def log_softmax(x):
return jax.nn.log_softmax(x)
return log_softmax
@jax_funcify.register(ScalarSoftplus)
def jax_funcify_ScalarSoftplus(op):
def scalarsoftplus(x):
return jnp.where(x < -30.0, 0.0, jnp.where(x > 30.0, x, jnp.log1p(jnp.exp(x))))
return scalarsoftplus
@jax_funcify.register(Second)
def jax_funcify_Second(op):
def second(x, y):
return jnp.broadcast_to(y, x.shape)
return second
@jax_funcify.register(AllocDiag)
def jax_funcify_AllocDiag(op):
offset = op.offset
def allocdiag(v, offset=offset):
return jnp.diag(v, k=offset)
return allocdiag
@jax_funcify.register(AllocEmpty)
def jax_funcify_AllocEmpty(op):
def allocempty(*shape):
return jnp.empty(shape, dtype=op.dtype)
return allocempty
@jax_funcify.register(Alloc)
def jax_funcify_Alloc(op):
def alloc(x, *shape):
res = jnp.broadcast_to(x, shape)
return res
return alloc
@jax_funcify.register(Dot)
def jax_funcify_Dot(op):
def dot(x, y):
return jnp.dot(x, y)
return dot
@jax_funcify.register(ARange)
def jax_funcify_ARange(op):
# XXX: This currently requires concrete arguments.
def arange(start, stop, step):
return jnp.arange(start, stop, step, dtype=op.dtype)
return arange
def jnp_safe_copy(x):
try:
res = jnp.copy(x)
except NotImplementedError:
warn("`jnp.copy` is not implemented yet. " "Using the object's `copy` method.")
if hasattr(x, "copy"):
res = jnp.array(x.copy())
else:
warn(f"Object has no `copy` method: {x}")
res = x
return res
@jax_funcify.register(DeepCopyOp)
def jax_funcify_DeepCopyOp(op):
def deepcopyop(x):
return jnp_safe_copy(x)
return deepcopyop
@jax_funcify.register(Shape)
def jax_funcify_Shape(op):
def shape(x):
return jnp.shape(x)
return shape
@jax_funcify.register(Shape_i)
def jax_funcify_Shape_i(op):
i = op.i
def shape_i(x):
return jnp.shape(x)[i]
return shape_i
@jax_funcify.register(SpecifyShape)
def jax_funcify_SpecifyShape(op):
def specifyshape(x, shape):
assert x.ndim == len(shape)
assert jnp.all(x.shape == tuple(shape)), (
"got shape",
x.shape,
"expected",
shape,
)
return x
return specifyshape
@jax_funcify.register(Rebroadcast)
def jax_funcify_Rebroadcast(op):
op_axis = op.axis
def rebroadcast(x):
for axis, value in op_axis.items():
if value and x.shape[axis] != 1:
raise ValueError(
"Dimension %s in Rebroadcast's input was"
" supposed to be 1 (got %s instead)" % (axis, x.shape[axis])
)
return x
return rebroadcast
@jax_funcify.register(ViewOp)
def jax_funcify_ViewOp(op):
    """Return a JAX implementation of `ViewOp` (an identity)."""

    def viewop(x):
        return x

    return viewop
@jax_funcify.register(Cast)
def jax_funcify_Cast(op):
    """Return a JAX implementation of `Cast`."""
    out_dtype = op.o_type.dtype

    def cast(x):
        return jnp.array(x).astype(out_dtype)

    return cast
@jax_funcify.register(TensorFromScalar)
def jax_funcify_TensorFromScalar(op):
    """Return a JAX implementation of `TensorFromScalar`."""

    def tensor_from_scalar(x):
        # `jnp.array` promotes the scalar to a 0-d array.
        return jnp.array(x)

    return tensor_from_scalar
@jax_funcify.register(ScalarFromTensor)
def jax_funcify_ScalarFromTensor(op):
    """Return a JAX implementation of `ScalarFromTensor`."""

    def scalar_from_tensor(x):
        # Take the first element of the flattened input.
        arr = jnp.array(x)
        return arr.flatten()[0]

    return scalar_from_tensor
@jax_funcify.register(Elemwise)
def jax_funcify_Elemwise(op):
    """Return a JAX implementation of `Elemwise`.

    The scalar `Op`'s conversion is used as-is.
    """
    return jax_funcify(op.scalar_op)
@jax_funcify.register(Composite)
def jax_funcify_Composite(op):
    """Return a JAX implementation of `Composite`."""
    # This approach basically gets rid of the fused `Elemwise` by turning each
    # `Op` in the `Composite` back into individually broadcasted NumPy-like
    # operations.
    # TODO: A better approach would involve something like `jax.vmap` or some
    # other operation that can perform the broadcasting that `Elemwise` does.
    inner_impl = jax_funcify(op.fgraph)

    def composite(*args):
        # The funcified graph returns a tuple; only its first output is
        # used here.
        return inner_impl(*args)[0]

    return composite
@jax_funcify.register(Scan)
def jax_funcify_Scan(op):
    """Return a JAX implementation of `Scan` built on `jax.lax.scan`.

    The `Scan` inner graph is funcified and wrapped in a
    `jax.lax.scan`-compatible step function; the carry threads the
    mit-sot/sit-sot taps, shared terms, and non-sequences between
    iterations.
    """
    inner_fg = FunctionGraph(op.inputs, op.outputs)
    # NOTE(review): `jax_funcify(inner_fg)` returns a single function,
    # but it is iterated over below in `jax_inner_func` — confirm this
    # is the intended behavior.
    jax_aet_inner_func = jax_funcify(inner_fg)

    def scan(*outer_inputs):
        scan_args = ScanArgs(
            list(outer_inputs), [None] * op.n_outs, op.inputs, op.outputs, op.info
        )
        # `outer_inputs` is a list with the following composite form:
        # [n_steps]
        # + outer_in_seqs
        # + outer_in_mit_mot
        # + outer_in_mit_sot
        # + outer_in_sit_sot
        # + outer_in_shared
        # + outer_in_nit_sot
        # + outer_in_non_seqs
        n_steps = scan_args.n_steps
        seqs = scan_args.outer_in_seqs

        # TODO: mit_mots
        mit_mot_in_slices = []

        # For each mit-sot, keep as many leading entries of the outer
        # input as its largest negative and positive taps require.
        mit_sot_in_slices = []
        for tap, seq in zip(scan_args.mit_sot_in_slices, scan_args.outer_in_mit_sot):
            neg_taps = [abs(t) for t in tap if t < 0]
            pos_taps = [abs(t) for t in tap if t > 0]
            max_neg = max(neg_taps) if neg_taps else 0
            max_pos = max(pos_taps) if pos_taps else 0
            init_slice = seq[: max_neg + max_pos]
            mit_sot_in_slices.append(init_slice)

        sit_sot_in_slices = [seq[0] for seq in scan_args.outer_in_sit_sot]

        # The carry holds everything that is threaded between iterations.
        init_carry = (
            mit_mot_in_slices,
            mit_sot_in_slices,
            sit_sot_in_slices,
            scan_args.outer_in_shared,
            scan_args.outer_in_non_seqs,
        )

        def jax_args_to_inner_scan(op, carry, x):
            # `carry` contains all inner-output taps, non_seqs, and shared
            # terms
            (
                inner_in_mit_mot,
                inner_in_mit_sot,
                inner_in_sit_sot,
                inner_in_shared,
                inner_in_non_seqs,
            ) = carry

            # `x` contains the in_seqs
            inner_in_seqs = x

            # `inner_scan_inputs` is a list with the following composite form:
            # inner_in_seqs
            # + sum(inner_in_mit_mot, [])
            # + sum(inner_in_mit_sot, [])
            # + inner_in_sit_sot
            # + inner_in_shared
            # + inner_in_non_seqs
            inner_in_mit_sot_flatten = []
            for array, index in zip(inner_in_mit_sot, scan_args.mit_sot_in_slices):
                inner_in_mit_sot_flatten.extend(array[jnp.array(index)])

            inner_scan_inputs = sum(
                [
                    inner_in_seqs,
                    inner_in_mit_mot,
                    inner_in_mit_sot_flatten,
                    inner_in_sit_sot,
                    inner_in_shared,
                    inner_in_non_seqs,
                ],
                [],
            )

            return inner_scan_inputs

        def inner_scan_outs_to_jax_outs(
            op,
            old_carry,
            inner_scan_outs,
        ):
            (
                inner_in_mit_mot,
                inner_in_mit_sot,
                inner_in_sit_sot,
                inner_in_shared,
                inner_in_non_seqs,
            ) = old_carry

            def update_mit_sot(mit_sot, new_val):
                # Shift the tap window one step forward.
                return jnp.concatenate([mit_sot[1:], new_val[None, ...]], axis=0)

            inner_out_mit_sot = [
                update_mit_sot(mit_sot, new_val)
                for mit_sot, new_val in zip(inner_in_mit_sot, inner_scan_outs)
            ]

            # This should contain all inner-output taps, non_seqs, and shared
            # terms
            if not inner_in_sit_sot:
                inner_out_sit_sot = []
            else:
                inner_out_sit_sot = inner_scan_outs
            new_carry = (
                inner_in_mit_mot,
                inner_out_mit_sot,
                inner_out_sit_sot,
                inner_in_shared,
                inner_in_non_seqs,
            )

            return new_carry

        def jax_inner_func(carry, x):
            inner_args = jax_args_to_inner_scan(op, carry, x)
            inner_scan_outs = [fn(*inner_args) for fn in jax_aet_inner_func]
            new_carry = inner_scan_outs_to_jax_outs(op, carry, inner_scan_outs)
            return new_carry, inner_scan_outs

        _, scan_out = jax.lax.scan(jax_inner_func, init_carry, seqs, length=n_steps)

        # We need to prepend the initial values so that the JAX output will
        # match the raw `Scan` `Op` output and, thus, work with a downstream
        # `Subtensor` `Op` introduced by the `scan` helper function.
        def append_scan_out(scan_in_part, scan_out_part):
            return jnp.concatenate([scan_in_part[:-n_steps], scan_out_part], axis=0)

        if scan_args.outer_in_mit_sot:
            scan_out_final = [
                append_scan_out(init, out)
                for init, out in zip(scan_args.outer_in_mit_sot, scan_out)
            ]
        elif scan_args.outer_in_sit_sot:
            scan_out_final = [
                append_scan_out(init, out)
                for init, out in zip(scan_args.outer_in_sit_sot, scan_out)
            ]

        # NOTE(review): when there are neither mit-sots nor sit-sots,
        # `scan_out_final` is unbound at this point — confirm callers
        # can never reach that case.
        if len(scan_out_final) == 1:
            scan_out_final = scan_out_final[0]

        return scan_out_final

    return scan
@jax_funcify.register(IfElse)
def jax_funcify_IfElse(op):
    """Return a JAX implementation of `IfElse` using `jax.lax.cond`."""
    n_outs = op.n_outs

    def ifelse(cond, *args, n_outs=n_outs):
        # `args` packs the true-branch values followed by the
        # false-branch values.
        true_vals = args[:n_outs]
        false_vals = args[n_outs:]
        res = jax.lax.cond(
            cond, lambda _: true_vals, lambda _: false_vals, operand=None
        )
        if n_outs > 1:
            return res
        return res[0]

    return ifelse
@jax_funcify.register(Subtensor)
def jax_funcify_Subtensor(op):
    """Return a JAX implementation shared by the `*Subtensor` `Op`s."""
    idx_list = getattr(op, "idx_list", None)

    def subtensor(x, *ilists):
        # Rebuild concrete indices from the `Op`'s index template and the
        # run-time index inputs.
        indices = indices_from_subtensor(ilists, idx_list)

        if len(indices) == 1:
            indices = indices[0]

        return x.__getitem__(indices)

    return subtensor


# Register the same implementation for each `Op` in `subtensor_ops`.
_ = [jax_funcify.register(op, jax_funcify_Subtensor) for op in subtensor_ops]
def jax_funcify_IncSubtensor(op):
    """Return a JAX implementation shared by the `*IncSubtensor` `Op`s."""
    idx_list = getattr(op, "idx_list", None)

    # "Set" vs. "increment" semantics map onto different `jax.ops`
    # functions.
    # NOTE(review): `jax.ops.index_update`/`index_add` are deprecated in
    # newer JAX releases (replaced by `x.at[idx].set/add`) — confirm the
    # pinned JAX version still provides them.
    if getattr(op, "set_instead_of_inc", False):
        jax_fn = jax.ops.index_update
    else:
        jax_fn = jax.ops.index_add

    def incsubtensor(x, y, *ilist, jax_fn=jax_fn, idx_list=idx_list):
        indices = indices_from_subtensor(ilist, idx_list)

        if len(indices) == 1:
            indices = indices[0]

        return jax_fn(x, indices, y)

    return incsubtensor


# Register the same implementation for each `Op` in `incsubtensor_ops`.
_ = [jax_funcify.register(op, jax_funcify_IncSubtensor) for op in incsubtensor_ops]
@jax_funcify.register(AdvancedIncSubtensor)
def jax_funcify_AdvancedIncSubtensor(op):
    """Return a JAX implementation of `AdvancedIncSubtensor`."""
    # NOTE(review): `jax.ops.index_update`/`index_add` are deprecated in
    # newer JAX releases (replaced by `x.at[idx].set/add`) — confirm the
    # pinned JAX version still provides them.
    if getattr(op, "set_instead_of_inc", False):
        jax_fn = jax.ops.index_update
    else:
        jax_fn = jax.ops.index_add

    def advancedincsubtensor(x, y, *ilist, jax_fn=jax_fn):
        # The advanced indices are forwarded directly as a tuple.
        return jax_fn(x, ilist, y)

    return advancedincsubtensor
@jax_funcify.register(FunctionGraph)
def jax_funcify_FunctionGraph(
    fgraph, order=None, input_storage=None, output_storage=None, storage_map=None
):
    """Create a JAX-compilable Python function from a `FunctionGraph`.

    Source code for a single function is generated whose body applies
    each node's JAX implementation in topological order; the source is
    then compiled and executed in a constructed global environment.

    Parameters
    ----------
    fgraph
        The `FunctionGraph` to convert.
    order
        Node evaluation order; defaults to `fgraph.toposort()`.
    input_storage, output_storage, storage_map
        Storage containers forwarded to `map_storage`; constants found
        in `storage_map` are embedded as global values.

    """
    if order is None:
        order = fgraph.toposort()

    input_storage, output_storage, storage_map = map_storage(
        fgraph, order, input_storage, output_storage, storage_map
    )

    global_env = {}

    fgraph_name = "jax_funcified_fgraph"

    def unique_name(x, names_counter=Counter([fgraph_name]), obj_to_names={}):
        # The mutable defaults are intentional: they persist across calls
        # so repeated lookups of the same object return the same name.
        if x in obj_to_names:
            return obj_to_names[x]

        if isinstance(x, Variable):
            # Sanitize the variable's name into a valid identifier, or
            # fall back to its auto-generated name.
            name = re.sub("[^0-9a-zA-Z]+", "_", x.name) if x.name else ""
            name = (
                name if (name.isidentifier() and not iskeyword(name)) else x.auto_name
            )
        elif isinstance(x, FunctionType):
            name = x.__name__
        else:
            name = type(x).__name__

        # Suffix with a running count so distinct objects never collide.
        name_suffix = names_counter.get(name, "")
        local_name = f"{name}{name_suffix}"

        names_counter.update((name,))
        obj_to_names[x] = local_name

        return local_name

    body_assigns = []
    for node in order:
        jax_func = jax_funcify(node.op)

        # Create a local alias with a unique name
        local_jax_func_name = unique_name(jax_func)
        global_env[local_jax_func_name] = jax_func

        node_input_names = []
        for i in node.inputs:
            local_input_name = unique_name(i)
            if storage_map[i][0] is not None or isinstance(i, Constant):
                # Constants need to be assigned locally and referenced
                global_env[local_input_name] = jax_typify(storage_map[i][0], None)
                # TODO: We could attempt to use the storage arrays directly
                # E.g. `local_input_name = f"{local_input_name}[0]"`
            node_input_names.append(local_input_name)

        node_output_names = [unique_name(v) for v in node.outputs]

        body_assigns.append(
            f"{', '.join(node_output_names)} = {local_jax_func_name}({', '.join(node_input_names)})"
        )

    fgraph_input_names = [unique_name(v) for v in fgraph.inputs]
    fgraph_output_names = [unique_name(v) for v in fgraph.outputs]
    joined_body_assigns = indent("\n".join(body_assigns), "    ")

    # A single output is still returned as a 1-tuple so callers can
    # index results uniformly.
    if len(fgraph_output_names) == 1:
        fgraph_return_src = f"({fgraph_output_names[0]},)"
    else:
        fgraph_return_src = ", ".join(fgraph_output_names)

    fgraph_def_src = f"""
def {fgraph_name}({", ".join(fgraph_input_names)}):
{joined_body_assigns}
    return {fgraph_return_src}
    """

    fgraph_def_ast = ast.parse(fgraph_def_src)

    # Create source code to be (at least temporarily) associated with the
    # compiled function (e.g. for easier debugging)
    with NamedTemporaryFile(delete=False) as f:
        filename = f.name
        f.write(fgraph_def_src.encode())

    mod_code = compile(fgraph_def_ast, filename, mode="exec")
    exec(mod_code, global_env, locals())

    fgraph_def = locals()[fgraph_name]

    return fgraph_def
@jax_funcify.register(CAReduce)
def jax_funcify_CAReduce(op):
    """Return a JAX implementation of `CAReduce`.

    Prefer the NumPy-equivalent reduction named by the `Op`'s
    ``nfunc_spec``; otherwise fall back to `jax.lax.reduce` with the
    scalar `Op`'s name and identity element.
    """
    axis = op.axis
    op_nfunc_spec = getattr(op, "nfunc_spec", None)
    scalar_nfunc_spec = getattr(op.scalar_op, "nfunc_spec", None)
    scalar_op_name = getattr(op.scalar_op, "name", None)
    scalar_op_identity = getattr(op.scalar_op, "identity", None)
    acc_dtype = getattr(op, "acc_dtype", None)

    def careduce(x):
        # BUG FIX: the previous version used ``nonlocal`` and rebound
        # `axis`/`acc_dtype`, so per-input defaults computed on the first
        # call leaked into every later call of this closure.  Use
        # per-call locals instead.
        axes = list(range(x.ndim)) if axis is None else list(axis)
        out_dtype = x.dtype.type if acc_dtype is None else acc_dtype

        if op_nfunc_spec:
            jax_op = getattr(jnp, op_nfunc_spec[0])
            return jax_op(x, axis=axes).astype(out_dtype)

        # The Aesara `Op` didn't tell us which NumPy equivalent to use (or
        # there isn't one), so we use this fallback approach
        if scalar_nfunc_spec:
            scalar_fn_name = scalar_nfunc_spec[0]
        elif scalar_op_name:
            scalar_fn_name = scalar_op_name

        # BUG FIX: ``reversed(sorted(...))`` is an iterator, which is
        # always truthy, so the no-reduction branch below was dead code.
        # A concrete (descending) list restores the intended check.
        to_reduce = sorted(axes, reverse=True)

        if to_reduce:
            # In this case, we need to use the `jax.lax` function (if there
            # is one), and not the `jnp` version.
            jax_op = getattr(jax.lax, scalar_fn_name)
            init_value = jnp.array(scalar_op_identity, dtype=out_dtype)
            return jax.lax.reduce(x, init_value, jax_op, to_reduce).astype(out_dtype)
        else:
            return x

    return careduce
@jax_funcify.register(MakeVector)
def jax_funcify_MakeVector(op):
    """Return a JAX implementation of `MakeVector`."""
    dtype = op.dtype

    def makevector(*x):
        # Pack the scalar arguments into a 1-d array.
        return jnp.array(x, dtype=dtype)

    return makevector
@jax_funcify.register(Reshape)
def jax_funcify_Reshape(op):
    """Return a JAX implementation of `Reshape`."""

    def reshape(x, shape):
        return jnp.reshape(x, shape)

    return reshape
@jax_funcify.register(DimShuffle)
def jax_funcify_DimShuffle(op):
    """Return a JAX implementation of `DimShuffle`."""

    def dimshuffle(x):
        # Permute first, with the dropped axes included in the transpose
        # order...
        res = jnp.transpose(x, op.shuffle + op.drop)

        # ...then cut off the trailing (dropped) axes and re-insert
        # length-1 axes at the `augment` positions.
        shape = list(res.shape[: len(op.shuffle)])

        for augm in op.augment:
            shape.insert(augm, 1)

        res = jnp.reshape(res, shape)

        if not op.inplace:
            res = jnp_safe_copy(res)

        return res

    return dimshuffle
@jax_funcify.register(Join)
def jax_funcify_Join(op):
    """Return a JAX implementation of `Join`."""

    def join(axis, *tensors):
        # tensors could also be tuples, and in this case they don't have a ndim
        tensors = [jnp.asarray(tensor) for tensor in tensors]
        view = op.view
        # IDIOM FIX: use a generator in `all(...)` instead of
        # materializing a throwaway list.
        if (view != -1) and all(
            tensor.shape[axis] == 0
            for tensor in tensors[0:view] + tensors[view + 1 :]
        ):
            # Every other input is empty along `axis`, so the result is
            # just the `view`-th input.
            return tensors[view]
        else:
            ndim = tensors[0].ndim
            if axis < -ndim:
                raise IndexError(
                    f"Join axis {int(axis)} out of bounds [0, {int(ndim)})"
                )

            return jnp.concatenate(tensors, axis=axis)

    return join
@jax_funcify.register(MaxAndArgmax)
def jax_funcify_MaxAndArgmax(op):
    """Return a JAX implementation of `MaxAndArgmax`.

    Returns a ``(max, argmax)`` pair, supporting reduction over
    multiple axes (which `argmax` alone does not).
    """
    axis = op.axis

    def maxandargmax(x, axis=axis):
        if axis is None:
            axes = tuple(range(x.ndim))
        else:
            axes = tuple(int(ax) for ax in axis)

        max_res = jnp.max(x, axis)

        # NumPy does not support multiple axes for argmax; this is a
        # work-around
        keep_axes = jnp.array(
            [i for i in range(x.ndim) if i not in axes], dtype="int64"
        )
        # Not-reduced axes in front
        transposed_x = jnp.transpose(
            x, jnp.concatenate((keep_axes, jnp.array(axes, dtype="int64")))
        )
        kept_shape = transposed_x.shape[: len(keep_axes)]
        reduced_shape = transposed_x.shape[len(keep_axes) :]

        # Numpy.prod returns 1.0 when arg is empty, so we cast it to int64
        # Otherwise reshape would complain citing float arg
        new_shape = kept_shape + (
            jnp.prod(jnp.array(reduced_shape, dtype="int64"), dtype="int64"),
        )
        # Collapse every reduced axis into one and take the argmax over it.
        reshaped_x = transposed_x.reshape(new_shape)

        max_idx_res = jnp.argmax(reshaped_x, axis=-1).astype("int64")

        return max_res, max_idx_res

    return maxandargmax
@jax_funcify.register(ExtractDiag)
def jax_funcify_ExtractDiag(op):
    """Return a JAX implementation of `ExtractDiag`."""

    def extract_diag(x, offset=op.offset, axis1=op.axis1, axis2=op.axis2):
        # Defaults bind the `Op`'s parameters at definition time.
        return jnp.diagonal(x, offset=offset, axis1=axis1, axis2=axis2)

    return extract_diag
@jax_funcify.register(Cholesky)
def jax_funcify_Cholesky(op):
    """Return a JAX implementation of `Cholesky`."""
    lower = op.lower

    def cholesky(a):
        # Keep the input's dtype on the result.
        return jsp.linalg.cholesky(a, lower=lower).astype(a.dtype)

    return cholesky
@jax_funcify.register(Solve)
def jax_funcify_Solve(op):
    """Return a JAX implementation of `Solve`."""
    # Only the lower-triangular structure is forwarded to SciPy's API.
    lower = op.A_structure == "lower_triangular"

    def solve(a, b):
        return jsp.linalg.solve(a, b, lower=lower)

    return solve
@jax_funcify.register(Det)
def jax_funcify_Det(op):
    """Return a JAX implementation of `Det`."""

    def det(x):
        return jnp.linalg.det(x)

    return det
@jax_funcify.register(Eig)
def jax_funcify_Eig(op):
    """Return a JAX implementation of `Eig`."""

    def eig(x):
        return jnp.linalg.eig(x)

    return eig
@jax_funcify.register(Eigh)
def jax_funcify_Eigh(op):
    """Return a JAX implementation of `Eigh`."""
    uplo = op.UPLO

    def eigh(x):
        # `UPLO` selects which triangle of `x` is used.
        return jnp.linalg.eigh(x, UPLO=uplo)

    return eigh
@jax_funcify.register(MatrixInverse)
def jax_funcify_MatrixInverse(op):
    """Return a JAX implementation of `MatrixInverse`."""

    def matrix_inverse(x):
        return jnp.linalg.inv(x)

    return matrix_inverse
@jax_funcify.register(QRFull)
def jax_funcify_QRFull(op):
    """Return a JAX implementation of `QRFull`."""
    mode = op.mode

    def qr_full(x):
        return jnp.linalg.qr(x, mode=mode)

    return qr_full
@jax_funcify.register(QRIncomplete)
def jax_funcify_QRIncomplete(op):
    """Return a JAX implementation of `QRIncomplete`."""
    mode = op.mode

    def qr_incomplete(x):
        return jnp.linalg.qr(x, mode=mode)

    return qr_incomplete
@jax_funcify.register(SVD)
def jax_funcify_SVD(op):
    """Return a JAX implementation of `SVD`."""
    full_matrices = op.full_matrices
    compute_uv = op.compute_uv

    def svd(x):
        return jnp.linalg.svd(x, full_matrices=full_matrices, compute_uv=compute_uv)

    return svd
@jax_funcify.register(CumOp)
def jax_funcify_CumOp(op):
    """Return a JAX implementation of `CumOp`."""
    axis = op.axis
    # `mode` selects cumulative sum ("add") or cumulative product.
    cum_fn = jnp.cumsum if op.mode == "add" else jnp.cumprod

    def cumop(x):
        return cum_fn(x, axis=axis)

    return cumop
@jax_funcify.register(DiffOp)
def jax_funcify_DiffOp(op):
    """Return a JAX implementation of `DiffOp`."""
    n = op.n
    axis = op.axis

    def diffop(x):
        return jnp.diff(x, n=n, axis=axis)

    return diffop
@jax_funcify.register(RepeatOp)
def jax_funcify_RepeatOp(op):
    """Return a JAX implementation of `RepeatOp`."""
    axis = op.axis

    def repeatop(x, repeats):
        return jnp.repeat(x, repeats, axis=axis)

    return repeatop
@jax_funcify.register(Bartlett)
def jax_funcify_Bartlett(op):
    """Return a JAX implementation of `Bartlett`."""

    def bartlett(x):
        # Bartlett (triangular) window of length `x`.
        return jnp.bartlett(x)

    return bartlett
@jax_funcify.register(FillDiagonal)
def jax_funcify_FillDiagonal(op):
    """`FillDiagonal` has no JAX conversion yet.

    The reference NumPy implementation (kept below for future work)
    relies on `ndarray.flat` assignment, which JAX arrays do not
    support; conversion therefore fails eagerly.
    """

    # def filldiagonal(a, val):
    #     if a.ndim == 2:
    #         step = a.shape[1] + 1
    #         end = a.shape[1] * a.shape[1]
    #         a.flat[:end:step] = val
    #     else:
    #         jnp.fill_diagonal(a, val)
    #
    #     return a
    #
    # return filldiagonal

    raise NotImplementedError("flatiter not implemented in JAX")
@jax_funcify.register(FillDiagonalOffset)
def jax_funcify_FillDiagonalOffset(op):
    """`FillDiagonalOffset` has no JAX conversion yet.

    As with `FillDiagonal`, the reference implementation (kept below
    for future work) relies on `ndarray.flat` assignment, which JAX
    arrays do not support; conversion therefore fails eagerly.
    """

    # def filldiagonaloffset(a, val, offset):
    #     height, width = a.shape
    #
    #     if offset >= 0:
    #         start = offset
    #         num_of_step = min(min(width, height), width - offset)
    #     else:
    #         start = -offset * a.shape[1]
    #         num_of_step = min(min(width, height), height + offset)
    #
    #     step = a.shape[1] + 1
    #     end = start + step * num_of_step
    #     a.flat[start:end:step] = val
    #
    #     return a
    #
    # return filldiagonaloffset

    raise NotImplementedError("flatiter not implemented in JAX")
@jax_funcify.register(Unique)
def jax_funcify_Unique(op):
    """Return a JAX implementation of `Unique`."""
    axis = op.axis
    if axis is not None:
        raise NotImplementedError(
            "jax.numpy.unique is not implemented for the axis argument"
        )

    return_index = op.return_index
    return_inverse = op.return_inverse
    return_counts = op.return_counts

    def unique(
        x,
        return_index=return_index,
        return_inverse=return_inverse,
        return_counts=return_counts,
        axis=axis,
    ):
        # FIX: use the public `jnp.unique` instead of the private
        # `jnp.lax_numpy._unique1d` helper, which is not a stable API.
        # `jnp.unique` already returns a bare array when no extra
        # outputs are requested and a tuple otherwise, matching the old
        # single-element unwrapping.
        return jnp.unique(
            x,
            return_index=return_index,
            return_inverse=return_inverse,
            return_counts=return_counts,
            axis=axis,
        )

    return unique
@jax_funcify.register(UnravelIndex)
def jax_funcify_UnravelIndex(op):
    """Return a JAX implementation of `UnravelIndex`."""
    order = op.order
    # Warn once at conversion time rather than on every call.
    warn("JAX ignores the `order` parameter in `unravel_index`.")

    def unravelindex(indices, dims, order=order):
        return jnp.unravel_index(indices, dims)

    return unravelindex
@jax_funcify.register(RavelMultiIndex)
def jax_funcify_RavelMultiIndex(op):
    """Return a JAX implementation of `RavelMultiIndex`."""
    mode = op.mode
    order = op.order

    def ravelmultiindex(*inp, mode=mode, order=order):
        # The last input carries the array shape; the rest are indices.
        *multi_index, dims = inp
        return jnp.ravel_multi_index(multi_index, dims, mode=mode, order=order)

    return ravelmultiindex
@jax_funcify.register(Eye)
def jax_funcify_Eye(op):
    """Return a JAX implementation of `Eye`."""
    dtype = op.dtype

    def eye(N, M, k):
        # N x M matrix with ones on the `k`-th diagonal.
        return jnp.eye(N, M, k, dtype=dtype)

    return eye
@jax_funcify.register(BatchedDot)
def jax_funcify_BatchedDot(op):
    """Return a JAX implementation of `BatchedDot`."""

    def batched_dot(a, b):
        # Both operands must share the leading (batch) dimension.
        if a.shape[0] != b.shape[0]:
            raise TypeError("Shapes must match in the 0-th dimension")
        # With a 2-d operand there is no inner matrix product per batch
        # entry, only a batched contraction over the remaining axis.
        if a.ndim == 2 or b.ndim == 2:
            return jnp.einsum("n...j,nj...->n...", a, b)
        # Full batched matrix-matrix product.
        return jnp.einsum("nij,njk->nik", a, b)

    return batched_dot
@jax_funcify.register(RandomVariable)
def jax_funcify_RandomVariable(op):
    """Return a JAX implementation of `RandomVariable`.

    Raises
    ------
    NotImplementedError
        When `jax.random` has no sampler matching the `Op`'s name.
    """
    name = op.name

    if not hasattr(jax.random, name):
        raise NotImplementedError(
            f"No JAX conversion for the given distribution: {name}"
        )

    def random_variable(rng, size, dtype, *args):
        # Derive a JAX PRNG key from the stored RNG state.
        prng = jax.random.PRNGKey(rng["state"]["key"][0])
        dtype = jnp.dtype(dtype)
        data = getattr(jax.random, name)(key=prng, shape=size)
        smpl_value = jnp.array(data, dtype=dtype)

        # Advance the key and write it back into the RNG state.
        # BUG FIX: `jax.ops.index_update` is purely functional, so its
        # result must be assigned back; the previous code discarded it,
        # leaving the stored key unchanged across calls.
        # NOTE(review): `jax.ops.index_update` is deprecated in newer
        # JAX releases (use `arr.at[0].set(...)`) — confirm the pinned
        # JAX version.
        prng = jax.random.split(prng, num=1)[0]
        rng["state"]["key"] = jax.ops.index_update(rng["state"]["key"], 0, prng[0])

        return (rng, smpl_value)

    return random_variable
# --- old ``aesara/link/jax/jax_linker.py`` (left diff column): imports ---
from warnings import warn

from numpy.random import RandomState

from aesara.graph.basic import Constant
from aesara.link.basic import Container, PerformLinker
from aesara.link.utils import gc_helper, map_storage, streamline
from aesara.utils import difference

# --- new ``aesara/link/jax/jax_dispatch.py`` (right diff column):
# deprecation shim re-exporting the renamed module ---
# from aesara.link.jax.dispatch import *
#
# import warnings
#
# warnings.warn(
#     "The module `aesara.link.jax.jax_linker` is deprecated "
#     "and has been renamed to `aesara.link.jax.linker`",
#     DeprecationWarning,
#     stacklevel=2,
# )
#
# from aesara.link.jax.linker import *
class JAXLinker(PerformLinker):
    """A `Linker` that JIT-compiles NumPy-based operations using JAX.

    Attributes
    ----------
    allow_non_jax: bool
        A boolean indicating whether or not an exception is thrown when the
        graph cannot be JAX compiled (e.g. the graph has an unsupported operator).
        If `allow_non_jax` is `True`, the fallback is currently Python compilation.

    """

    allow_non_jax = False

    def create_jax_thunks(
        self, compute_map, order, input_storage, output_storage, storage_map
    ):
        """Create a thunk for each output of the `Linker`'s `FunctionGraph`.

        This differs from the other thunk-making functions in that it only
        produces thunks for the `FunctionGraph` output nodes.

        Parameters
        ----------
        compute_map: dict
            The compute map dictionary.
        storage_map: dict
            The storage map dictionary.

        Returns
        -------
        thunks: list
            A list containing the thunks.
        output_nodes: list
            A list containing the output nodes.

        """
        import jax

        # FIX: import from the renamed module `aesara.link.jax.dispatch`;
        # the old `aesara.link.jax.jax_dispatch` name is only kept as a
        # deprecation shim.
        from aesara.link.jax.dispatch import jax_funcify, jax_typify

        output_nodes = [o.owner for o in self.fgraph.outputs]

        # Create a JAX-compilable function from our `FunctionGraph`
        jaxed_fgraph = jax_funcify(
            self.fgraph,
            input_storage=input_storage,
            output_storage=output_storage,
            storage_map=storage_map,
        )

        # I suppose we can consider `Constant`s to be "static" according to
        # JAX.
        static_argnums = [
            n for n, i in enumerate(self.fgraph.inputs) if isinstance(i, Constant)
        ]

        thunk_inputs = []
        for n in self.fgraph.inputs:
            sinput = storage_map[n]
            if isinstance(sinput[0], RandomState):
                new_value = jax_typify(sinput[0], getattr(sinput[0], "dtype", None))
                # We need to remove the reference-based connection to the
                # original `RandomState`/shared variable's storage, because
                # subsequent attempts to use the same shared variable within
                # other non-JAXified graphs will have problems.
                sinput = [new_value]
            thunk_inputs.append(sinput)

        thunks = []

        thunk_outputs = [storage_map[n] for n in self.fgraph.outputs]

        fgraph_jit = jax.jit(jaxed_fgraph, static_argnums)

        def thunk(
            fgraph=self.fgraph,
            fgraph_jit=fgraph_jit,
            thunk_inputs=thunk_inputs,
            thunk_outputs=thunk_outputs,
        ):
            outputs = fgraph_jit(*[x[0] for x in thunk_inputs])

            # Write the computed values into the output storage cells and
            # mark the outputs as computed.
            for o_node, o_storage, o_val in zip(fgraph.outputs, thunk_outputs, outputs):
                compute_map[o_node][0] = True
                if len(o_storage) > 1:
                    assert len(o_storage) == len(o_val)
                    for i, o_sub_val in enumerate(o_val):
                        o_storage[i] = o_sub_val
                else:
                    o_storage[0] = o_val
            return outputs

        thunk.inputs = thunk_inputs
        thunk.outputs = thunk_outputs
        thunk.lazy = False

        thunks.append(thunk)

        # This is a bit hackish, but we only return one of the output nodes
        return thunks, output_nodes[:1]

    def make_all(self, input_storage=None, output_storage=None, storage_map=None):
        """Build the streamlined function, containers, thunks, and nodes.

        Falls back to Python compilation per node when JAX conversion
        raises `NotImplementedError` and `allow_non_jax` is set.
        """
        fgraph = self.fgraph
        nodes = self.schedule(fgraph)
        no_recycling = self.no_recycling

        input_storage, output_storage, storage_map = map_storage(
            fgraph, nodes, input_storage, output_storage, storage_map
        )

        compute_map = {}
        for k in storage_map:
            compute_map[k] = [k.owner is None]

        try:
            # We need to create thunk functions that will populate the output
            # storage arrays with the JAX-computed values.
            thunks, nodes = self.create_jax_thunks(
                compute_map, nodes, input_storage, output_storage, storage_map
            )
        except NotImplementedError as e:
            if not self.allow_non_jax:
                raise

            warn(f"JaxLinker could not JAXify graph: {e}")

            # Python-compilation fallback: one thunk per node.
            thunks = []
            for node in nodes:
                thunk = node.op.make_thunk(
                    node, storage_map, compute_map, no_recycling, "py"
                )
                thunk_inputs = [storage_map[v] for v in node.inputs]
                thunk_outputs = [storage_map[v] for v in node.outputs]

                thunk.inputs = thunk_inputs
                thunk.outputs = thunk_outputs

                thunks.append(thunk)

        computed, last_user = gc_helper(nodes)

        if self.allow_gc:
            post_thunk_old_storage = []
            for node in nodes:
                post_thunk_old_storage.append(
                    [
                        storage_map[input]
                        for input in node.inputs
                        if (input in computed)
                        and (input not in fgraph.outputs)
                        and (node == last_user[input])
                    ]
                )
        else:
            post_thunk_old_storage = None

        if no_recycling is True:
            no_recycling = list(storage_map.values())
            no_recycling = difference(no_recycling, input_storage)
        else:
            no_recycling = [
                storage_map[r] for r in no_recycling if r not in fgraph.inputs
            ]

        fn = streamline(
            fgraph, thunks, nodes, post_thunk_old_storage, no_recycling=no_recycling
        )

        fn.allow_gc = self.allow_gc
        fn.storage_map = storage_map

        return (
            fn,
            [
                Container(input, storage)
                for input, storage in zip(fgraph.inputs, input_storage)
            ],
            [
                Container(output, storage, readonly=True)
                for output, storage in zip(fgraph.outputs, output_storage)
            ],
            thunks,
            nodes,
        )
from warnings import warn
from numpy.random import RandomState
from aesara.graph.basic import Constant
from aesara.link.basic import Container, PerformLinker
from aesara.link.utils import gc_helper, map_storage, streamline
from aesara.utils import difference
class JAXLinker(PerformLinker):
    """A `Linker` that JIT-compiles NumPy-based operations using JAX.

    Attributes
    ----------
    allow_non_jax: bool
        A boolean indicating whether or not an exception is thrown when the
        graph cannot be JAX compiled (e.g. the graph has an unsupported operator).
        If `allow_non_jax` is `True`, the fallback is currently Python compilation.

    """

    allow_non_jax = False

    def create_jax_thunks(
        self, compute_map, order, input_storage, output_storage, storage_map
    ):
        """Create a thunk for each output of the `Linker`'s `FunctionGraph`.

        This differs from the other thunk-making functions in that it only
        produces thunks for the `FunctionGraph` output nodes.

        Parameters
        ----------
        compute_map: dict
            The compute map dictionary.
        storage_map: dict
            The storage map dictionary.

        Returns
        -------
        thunks: list
            A list containing the thunks.
        output_nodes: list
            A list containing the output nodes.

        """
        # NOTE(review): `jax` is imported locally, presumably to keep it
        # an optional dependency — confirm.
        import jax

        from aesara.link.jax.dispatch import jax_funcify, jax_typify

        output_nodes = [o.owner for o in self.fgraph.outputs]

        # Create a JAX-compilable function from our `FunctionGraph`
        jaxed_fgraph = jax_funcify(
            self.fgraph,
            input_storage=input_storage,
            output_storage=output_storage,
            storage_map=storage_map,
        )

        # I suppose we can consider `Constant`s to be "static" according to
        # JAX.
        static_argnums = [
            n for n, i in enumerate(self.fgraph.inputs) if isinstance(i, Constant)
        ]

        thunk_inputs = []
        for n in self.fgraph.inputs:
            sinput = storage_map[n]
            if isinstance(sinput[0], RandomState):
                new_value = jax_typify(sinput[0], getattr(sinput[0], "dtype", None))
                # We need to remove the reference-based connection to the
                # original `RandomState`/shared variable's storage, because
                # subsequent attempts to use the same shared variable within
                # other non-JAXified graphs will have problems.
                sinput = [new_value]
            thunk_inputs.append(sinput)

        thunks = []

        thunk_outputs = [storage_map[n] for n in self.fgraph.outputs]

        fgraph_jit = jax.jit(jaxed_fgraph, static_argnums)

        def thunk(
            fgraph=self.fgraph,
            fgraph_jit=fgraph_jit,
            thunk_inputs=thunk_inputs,
            thunk_outputs=thunk_outputs,
        ):
            outputs = fgraph_jit(*[x[0] for x in thunk_inputs])

            # Write the computed values into the output storage cells and
            # mark the outputs as computed.
            for o_node, o_storage, o_val in zip(fgraph.outputs, thunk_outputs, outputs):
                compute_map[o_node][0] = True
                if len(o_storage) > 1:
                    assert len(o_storage) == len(o_val)
                    for i, o_sub_val in enumerate(o_val):
                        o_storage[i] = o_sub_val
                else:
                    o_storage[0] = o_val
            return outputs

        thunk.inputs = thunk_inputs
        thunk.outputs = thunk_outputs
        thunk.lazy = False

        thunks.append(thunk)

        # This is a bit hackish, but we only return one of the output nodes
        return thunks, output_nodes[:1]

    def make_all(self, input_storage=None, output_storage=None, storage_map=None):
        """Build the streamlined function, containers, thunks, and nodes.

        Falls back to Python compilation per node when JAX conversion
        raises `NotImplementedError` and `allow_non_jax` is set.
        """
        fgraph = self.fgraph
        nodes = self.schedule(fgraph)
        no_recycling = self.no_recycling

        input_storage, output_storage, storage_map = map_storage(
            fgraph, nodes, input_storage, output_storage, storage_map
        )

        compute_map = {}
        for k in storage_map:
            compute_map[k] = [k.owner is None]

        try:
            # We need to create thunk functions that will populate the output
            # storage arrays with the JAX-computed values.
            thunks, nodes = self.create_jax_thunks(
                compute_map, nodes, input_storage, output_storage, storage_map
            )
        except NotImplementedError as e:
            if not self.allow_non_jax:
                raise

            warn(f"JaxLinker could not JAXify graph: {e}")

            # Python-compilation fallback: one thunk per node.
            thunks = []
            for node in nodes:
                thunk = node.op.make_thunk(
                    node, storage_map, compute_map, no_recycling, "py"
                )
                thunk_inputs = [storage_map[v] for v in node.inputs]
                thunk_outputs = [storage_map[v] for v in node.outputs]

                thunk.inputs = thunk_inputs
                thunk.outputs = thunk_outputs

                thunks.append(thunk)

        computed, last_user = gc_helper(nodes)

        if self.allow_gc:
            post_thunk_old_storage = []
            for node in nodes:
                post_thunk_old_storage.append(
                    [
                        storage_map[input]
                        for input in node.inputs
                        if (input in computed)
                        and (input not in fgraph.outputs)
                        and (node == last_user[input])
                    ]
                )
        else:
            post_thunk_old_storage = None

        if no_recycling is True:
            no_recycling = list(storage_map.values())
            no_recycling = difference(no_recycling, input_storage)
        else:
            no_recycling = [
                storage_map[r] for r in no_recycling if r not in fgraph.inputs
            ]

        fn = streamline(
            fgraph, thunks, nodes, post_thunk_old_storage, no_recycling=no_recycling
        )

        fn.allow_gc = self.allow_gc
        fn.storage_map = storage_map

        return (
            fn,
            [
                Container(input, storage)
                for input, storage in zip(fgraph.inputs, input_storage)
            ],
            [
                Container(output, storage, readonly=True)
                for output, storage in zip(fgraph.outputs, output_storage)
            ],
            thunks,
            nodes,
        )
...@@ -39,7 +39,7 @@ logic. ...@@ -39,7 +39,7 @@ logic.
return res if n_outs > 1 else res[0] return res if n_outs > 1 else res[0]
*Code in context:* *Code in context:*
https://github.com/pymc-devs/aesara/blob/master/aesara/link/jax/jax_dispatch.py#L583 https://github.com/pymc-devs/aesara/blob/master/aesara/link/jax/dispatch.py#L583
Step 3: Register the function with the jax_funcify dispatcher Step 3: Register the function with the jax_funcify dispatcher
============================================================= =============================================================
...@@ -49,9 +49,9 @@ function with the Aesara JAX Linker. This is done through the dispatcher ...@@ -49,9 +49,9 @@ function with the Aesara JAX Linker. This is done through the dispatcher
decorator and closure as seen below. If unsure how dispatching works a decorator and closure as seen below. If unsure how dispatching works a
short tutorial on dispatching is at the bottom. short tutorial on dispatching is at the bottom.
The linker functions should be added to ``jax_dispatch`` module linked The linker functions should be added to ``dispatch`` module linked
below. below.
https://github.com/pymc-devs/aesara/blob/master/aesara/link/jax/jax_dispatch.py https://github.com/pymc-devs/aesara/blob/master/aesara/link/jax/dispatch.py
Here’s an example for the Eye Op. Here’s an example for the Eye Op.
...@@ -69,7 +69,7 @@ Here’s an example for the Eye Op. ...@@ -69,7 +69,7 @@ Here’s an example for the Eye Op.
return eye return eye
*Code in context:* *Code in context:*
https://github.com/pymc-devs/aesara/blob/master/aesara/link/jax/jax_dispatch.py#L1071 https://github.com/pymc-devs/aesara/blob/master/aesara/link/jax/dispatch.py#L1071
Step 4: Write tests Step 4: Write tests
=================== ===================
......
...@@ -4,6 +4,8 @@ ignore = E203,E231,E501,E741,W503,W504,C901 ...@@ -4,6 +4,8 @@ ignore = E203,E231,E501,E741,W503,W504,C901
max-line-length = 88 max-line-length = 88
per-file-ignores = per-file-ignores =
**/__init__.py:F401,E402,F403 **/__init__.py:F401,E402,F403
aesara/link/jax/jax_dispatch.py:E402,F403,F401
aesara/link/jax/jax_linker.py:E402,F403,F401
aesara/sparse/sandbox/sp2.py:F401 aesara/sparse/sandbox/sp2.py:F401
tests/tensor/test_basic_scipy.py:E402 tests/tensor/test_basic_scipy.py:E402
tests/sparse/test_basic.py:E402 tests/sparse/test_basic.py:E402
......
...@@ -321,7 +321,7 @@ def test_jax_Composite(): ...@@ -321,7 +321,7 @@ def test_jax_Composite():
def test_jax_FunctionGraph_names(): def test_jax_FunctionGraph_names():
import inspect import inspect
from aesara.link.jax.jax_dispatch import jax_funcify from aesara.link.jax.dispatch import jax_funcify
x = scalar("1x") x = scalar("1x")
y = scalar("_") y = scalar("_")
...@@ -337,7 +337,7 @@ def test_jax_FunctionGraph_names(): ...@@ -337,7 +337,7 @@ def test_jax_FunctionGraph_names():
def test_jax_FunctionGraph_once(): def test_jax_FunctionGraph_once():
"""Make sure that an output is only computed once when it's referenced multiple times.""" """Make sure that an output is only computed once when it's referenced multiple times."""
from aesara.link.jax.jax_dispatch import jax_funcify from aesara.link.jax.dispatch import jax_funcify
x = vector("x") x = vector("x")
y = vector("y") y = vector("y")
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论