rocm_jax/jax/experimental/jax2tf/call_tf.py

# Copyright 2021 The JAX Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Allows JAX to call TensorFlow functions with support for autodiff.

**Experimental: please give feedback, and expect changes.**

This module introduces the function :func:`call_tf` that allows JAX to call
TensorFlow functions.

For examples and details, see
https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#calling-tensorflow-functions-from-jax.

"""

from __future__ import annotations

from collections.abc import Callable, Sequence
import dataclasses
import functools
from typing import Any

from absl import logging
import jax
from jax import dlpack
from jax import dtypes
from jax import numpy as jnp
from jax import tree_util
from jax._src import ad_util
from jax._src import core
from jax._src import effects
from jax._src import util
from jax._src.lib import xla_client
from jax._src.lib.mlir import ir
from jax._src.lib.mlir.dialects import func as func_dialect
from jax._src.lib.mlir.dialects import hlo
from jax.experimental.jax2tf import jax2tf as jax2tf_internal
from jax._src.interpreters import mlir
import numpy as np
import tensorflow as tf


map = util.safe_map
zip = util.safe_zip

TfConcreteFunction = Any
TfVal = jax2tf_internal.TfVal

# The platforms for which to use DLPack to avoid copying (only works on GPU
# and CPU at the moment, and only for Array). For CPU we don't need
# DLPack, if we are careful.
_DLPACK_PLATFORMS = ("gpu",)

class UnspecifiedOutputShapeDtype:
  pass

def call_tf(
    callable_tf: Callable,
    has_side_effects=True,
    ordered=False,
    output_shape_dtype=UnspecifiedOutputShapeDtype(),
    call_tf_graph=False,
) -> Callable:
  """Calls a TensorFlow function from JAX, with support for reverse autodiff.

  The ``callable_tf`` will be called with TensorFlow-compatible arguments (
  numpy.ndarray, ``tf.Tensor`` or ``tf.Variable``) or pytrees thereof. The
  function must return the same type of results.

  If ``call_tf`` appears in a JAX staging context (:func:`jax.jit`,
  or :func:`jax.pmap`, or a control-flow primitive) then
  ``callable_tf`` will be compiled with ``tf.function(callable_tf,
  jit_compile=True)``
  and the resulting XLA computation will be embedded in JAX's XLA computation.

  If ``call_tf`` appears outside a JAX staging context, it will be called inline
  using TensorFlow eager mode.

  The ``call_tf`` supports JAX's reverse-mode autodiff, in which case the
  ``callable_tf`` will be differentiated using ``tf.GradientTape``. This means
  that the gradient will be TensorFlow-accurate, e.g., will respect the
  custom gradients that may be defined for the code in ``callable_tf``.

  For an example and more details see the
  `README
  <https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#calling-tensorflow-functions-from-jax>`_.

  Args:
    callable_tf: a TensorFlow Callable that can take a pytree of TensorFlow
      arguments.
    has_side_effects: if True then it ensures that instances of this primitive
      are not removed or replicated by JAX optimizations such as dead-code
      elimination.
    ordered: If true, calls are modeled as having ordered effects.
    output_shape_dtype: An optional declaration of the expected shape and dtype
      of the result of the called TensorFlow function. If given it will be used
      during JAX tracing to form the abstract values of the results of the
      `call_tf`. If not given then we form a `tf.Graph` for the called
      TensorFlow function and we use the TensorFlow-inferred shapes and types.
      Must be a pytree matching the structure of the nested structure returned
      from the TensorFlow function, containing objects with `.shape` and
      `.dtype` attributes, e.g., `jax.ShapeDtypeStruct` or `jax.Array`.
    call_tf_graph: EXPERIMENTAL, DO NOT USE. We may change the name in the
      future.

  Returns: a JAX callable that can be invoked with JAX pytree arguments, in
    op-by-op mode or in a staged context. This callable can be used with JAX's
    reverse-mode autodiff (:func:`jax.grad`).
  """
  @jax.custom_vjp
  def make_call(*args_jax):
    """We wrap it all in `make_call` so that we can attach custom VJP."""

    args_flat_jax, args_treedef = tree_util.tree_flatten(args_jax)
    # Canonicalize the arguments; e.g., makes them x32 if JAX is in 32-bit mode
    def canonical_arg(v):
      v = v if getattr(v, "dtype", None) else np.asarray(v)
      dtype = dtypes.canonicalize_dtype(v.dtype)
      if dtype != v.dtype:
        v = v.astype(dtype)
      return v

    args_flat_jax = tuple(map(canonical_arg, args_flat_jax))
    def make_tensorspec(a_jax):
      a_tf_dtype = jax2tf_internal._to_tf_dtype(a_jax.dtype)
      a_tf_shape = [d if core.is_constant_dim(d) else None for d in a_jax.shape]
      return tf.TensorSpec(a_tf_shape, a_tf_dtype)
    args_flat_sig_tf = tuple(map(make_tensorspec, args_flat_jax))

    if not isinstance(output_shape_dtype, UnspecifiedOutputShapeDtype):
      output_shape_dtype_flat, output_shape_dtype_tree = tree_util.tree_flatten(output_shape_dtype)
      output_avals = tuple(core.ShapedArray(st.shape, st.dtype) for st in output_shape_dtype_flat)
    else:
      output_avals, output_shape_dtype_tree = None, None

    res_treedef = None  # We'll store here the result treedef
    res_tf_flat = None  # For error reporting
    # The function below will be called at least once, either in eager
    # mode during jax2tf_call_tf or in graph mode during _get_concrete_function_tf()
    def callable_flat_tf(*args_tf_flat: TfVal) -> Sequence[TfVal]:
      args_tf = args_treedef.unflatten(args_tf_flat)
      res_tf = callable_tf(*args_tf)

      # b/279454591: When `callable_tf` is a tf function with zero outputs, it
      # returns a `StatefulPartitionedCall` (if the function is stateful) or
      # `PartitionedCall` (if the function is stateless) op instead of
      # tf.Tensors. We work around this issue by replacing the output `res_tf`
      # with an empty list.

      if isinstance(res_tf, tf.Operation):
        assert (
            res_tf.type == "StatefulPartitionedCall"
            or res_tf.type == "PartitionedCall"
        )
        t_out = res_tf.get_attr("Tout")
        # t_out should be an empty list.
        assert not t_out, (
            "The TF function returned an unexpected result, please check its"
            f" function body. res_tf = {res_tf}"
        )
        res_tf = t_out

      nonlocal res_treedef, res_tf_flat
      res_tf_flat, res_treedef_now = tree_util.tree_flatten(res_tf)
      assert res_treedef is None or res_treedef == res_treedef_now, (
          f"Subsequent calls had different results. Previous {res_treedef} and now {res_treedef_now}")
      res_treedef = res_treedef_now
      if output_avals is not None:
        if res_treedef != output_shape_dtype_tree:
          raise ValueError(
              "The pytree of the TensorFlow function results does not match the "
              "pytree of the declared output_shape_dtype:\n"
              f"results pytree: {res_treedef}\noutput_shape_dtype tree: {output_shape_dtype_tree}")
        assert len(output_avals) == len(res_tf_flat)

      checked_res_tf_flat = [
          check_tf_result(i, r_tf, r_aval)
          for i, (r_tf, r_aval) in enumerate(
              zip(res_tf_flat,
                  (output_avals
                   if output_avals is not None
                   else (None,) * len(res_tf_flat))))]
      return checked_res_tf_flat

    # Prepare a tf.function ahead of time, to cache the concrete functions. This
    # won't be used in op-by-op execution mode.
    function_flat_tf = tf.function(
        callable_flat_tf, autograph=False, jit_compile=not call_tf_graph)

    res_jax_flat = call_tf_p.bind(
        *args_flat_jax,
        # Carry the actual function such that op-by-op call can call in TF eager mode.
        callable_flat_tf=callable_flat_tf,
        function_flat_tf=function_flat_tf,
        args_flat_sig_tf=args_flat_sig_tf,
        output_avals=output_avals,
        has_side_effects=has_side_effects,
        ordered=ordered,
        call_tf_graph=call_tf_graph,
    )

    # We must have called callable_flat_tf by nοw
    assert res_treedef is not None
    return res_treedef.unflatten(res_jax_flat)

  # Define the fwd and bwd custom_vjp functions
  def make_call_vjp_fwd(*args_jax):
    # Return the primal arguments as the residual
    return make_call(*args_jax), args_jax

  def make_call_vjp_bwd(residual_jax, ct_res_jax):
    args_jax = residual_jax  # residual is the primal argument

    def tf_vjp_fun(args_tf, ct_res_tf):
      """Invoke TF gradient."""

      # TF does not like us to watch non-float vars or Nones.
      def replace_non_float_or_none(arg_tf):
        if arg_tf is not None and (
            arg_tf.dtype.is_floating or arg_tf.dtype.is_complex
        ):
          return arg_tf
        else:
          # When watched, this will be ignored. When used in results it will
          # result in a floating 0. gradient, which JAX will ignore (and
          # replace it with a float0)
          return tf.zeros((), dtype=tf.float32)

      watched_args_tf = tf.nest.map_structure(
          replace_non_float_or_none, args_tf
      )
      with tf.GradientTape(persistent=True) as tape:
        tape.watch(watched_args_tf)
        res = callable_tf(*args_tf)

      tf.nest.assert_same_structure(res, ct_res_tf)
      dres_darg = tape.gradient(
          tf.nest.map_structure(replace_non_float_or_none, res),
          sources=watched_args_tf,
          output_gradients=ct_res_tf,
          unconnected_gradients=tf.UnconnectedGradients.ZERO,
      )

      dres_darg = tree_util.tree_map(
          lambda x: x if x is None else tf.convert_to_tensor(x),
          dres_darg,
      )

      # callable_tf may mutate (the structure of) args_tf, thus we check against
      # watched_args_tf which should be structurally the same as the original
      # args_tf.
      tf.nest.assert_same_structure(dres_darg, watched_args_tf)
      return dres_darg

    # Use call_tf to call the VJP function
    ct_args_jax = call_tf(tf_vjp_fun)(args_jax, ct_res_jax)
    # We must make the float0s that JAX expects
    def fix_float0(arg_jax, ct_arg_jax):
      if arg_jax is None:
        return None
      arg_dtype = dtypes.result_type(arg_jax)  # May be scalar
      ct_arg_dtype = core.primal_dtype_to_tangent_dtype(arg_dtype)
      if ct_arg_dtype != ct_arg_jax.dtype:
        return ad_util.zeros_like_aval(core.ShapedArray(np.shape(arg_jax),
                                                        ct_arg_dtype))
      return ct_arg_jax

    ct_args_jax_fixed = tree_util.tree_map(fix_float0, args_jax, ct_args_jax,
                                           is_leaf=lambda x: x is None)
    return ct_args_jax_fixed

  make_call.defvjp(make_call_vjp_fwd, make_call_vjp_bwd)
  return util.wraps(callable_tf)(make_call)


def check_tf_result(idx: int, r_tf: TfVal, r_aval: core.ShapedArray | None) -> TfVal:
  # Check that the TF function returns values of expected types. This
  # improves error reporting, preventing hard-to-diagnose errors downstream
  try:
    jax2tf_internal._tfval_to_tensor_jax_dtype(r_tf)
  except Exception as e:
    msg = ("The called TF function returns a result that is not "
           f"convertible to JAX: {r_tf}.")
    raise ValueError(msg) from e

  if r_aval is None:
    return r_tf
  # We convert to TF type, and canonicalize to 32-bit if necessary
  r_aval_dtype_tf = jax2tf_internal._to_tf_dtype(r_aval.dtype)
  # Checking shapes is trickier in presence of dynamic shapes. I wish we could
  # check at runtime that the returned shape matches the declared shape. I wish
  # that tf.ensure_shape did this, but it can only take shapes that contain None
  # not computed shapes. However, in eager mode we should be able to resolve
  # the declared shapes to constants and we get better checking.
  if tf.executing_eagerly():
    r_aval_shape_tf = jax2tf_internal._eval_shape(r_aval.shape)
  else:
    r_aval_shape_tf = jax2tf_internal._aval_to_tf_shape(r_aval)
  # We do as much checking as we can here, instead of relying on tf.ensure_shape
  # because the latter gives different errors in eager vs. compiled mode.
  # TODO(b/279454591): This strange error is from TF. Eager function suppose
  # return tf Val with concrete shape but not.  Here we change exception to warn
  # and bypass it. This case need revisit on TF side.
  try:
    _ = len(r_tf.shape)
  except ValueError as e:
    msg = (
        "The shape check test cannot be performed because the shape of the"
        "`r_tf` tensor cannot be obtained."
        f"r_tf = {r_tf}, r_aval = {r_aval}"
    )
    msg += str(e)
    logging.warning(msg)
    return r_tf
  if (r_tf.dtype != r_aval_dtype_tf or
      len(r_tf.shape) != len(r_aval_shape_tf) or
      any(r_aval_d is not None and r_tf_d is not None and r_aval_d != r_tf_d
          for r_tf_d, r_aval_d in zip(r_tf.shape, r_aval_shape_tf))):
    msg = ("The shapes or dtypes returned by the TensorFlow function "
           "do not match the declared output_shape_dtype:\n"
           f"Result[{idx}] is {r_tf.dtype}[{r_tf.shape}] vs. expected {r_aval_dtype_tf}[{r_aval_shape_tf}]")
    raise ValueError(msg)
  # At this point tf.ensure_shape does not do much, it should never throw an
  # error, albeit it may refine the shape a bit.
  return tf.ensure_shape(r_tf, r_aval_shape_tf)


call_tf_p = core.Primitive("call_tf")
call_tf_p.multiple_results = True

# The impl will be used in op-by-op mode and calls callable_tf in TF eager mode.
def _call_tf_impl(*args_jax_flat, callable_flat_tf, **_):
  # On GPU we use dlpack to avoid copies of data to the host.
  def _arg_jax_to_tf(arg_jax):
    if (isinstance(arg_jax, jax.Array) and
        list(arg_jax.devices())[0].platform in _DLPACK_PLATFORMS and
        arg_jax.dtype.type in dlpack.SUPPORTED_DTYPES):
      arg_dlpack = jax.dlpack.to_dlpack(arg_jax)
      return tf.experimental.dlpack.from_dlpack(arg_dlpack)
    # The following avoids copies to the host on CPU, always for Array
    # and even for ndarray if they are sufficiently aligned.
    # TODO(necula): on TPU this copies to the host!
    if getattr(arg_jax, 'dtype', None) == dtypes.float0:
      return tf.zeros(shape=arg_jax.shape,
                      dtype=jax2tf_internal._tf_np_dtype_for_float0)
    return tf.constant(np.asarray(arg_jax))

  args_tf_flat = tuple(map(_arg_jax_to_tf, args_jax_flat))
  with jax2tf_internal.inside_call_tf():
    # Call in TF eager mode
    res_tf_flat = callable_flat_tf(*args_tf_flat)

  def _res_tf_to_jax(res_tf: TfVal):
    res_tf, jax_dtype = jax2tf_internal._tfval_to_tensor_jax_dtype(res_tf)
    if isinstance(res_tf, tf.Tensor) and jax_dtype.type in dlpack.SUPPORTED_DTYPES:
      res_tf_platform = tf.DeviceSpec.from_string(res_tf.backing_device).device_type
      res_jax_platform = res_tf_platform.lower()
      if res_jax_platform in _DLPACK_PLATFORMS:
        res_dlpack = tf.experimental.dlpack.to_dlpack(res_tf)
        return jax.dlpack.from_dlpack(res_dlpack)

    # When working with a bfloat16 scalar tf.Tensor,np.asarray() can fail.
    # To handle this special case, we create a numpy copy.
    if res_tf.shape == tf.TensorShape([]) and res_tf.dtype == tf.bfloat16:
      return jax.device_put(jnp.array(res_tf.numpy()))
    else:
      return jax.device_put(np.asarray(res_tf))

  return list(map(_res_tf_to_jax, res_tf_flat))


call_tf_p.def_impl(_call_tf_impl)

@functools.lru_cache(maxsize=128)
def _get_concrete_function_tf(function_flat_tf, args_flat_sig_tf):  # -> tf.ConcreteFunction
  with jax2tf_internal.inside_call_tf():
    return function_flat_tf.get_concrete_function(*args_flat_sig_tf)


# Mark the effectful instances of call_tf
@dataclasses.dataclass(frozen=True)
class CallTfEffect(effects.Effect):
  __str__ = lambda _: "CallTfEffect"

call_tf_effect = CallTfEffect()

effects.lowerable_effects.add_type(CallTfEffect)
effects.control_flow_allowed_effects.add_type(CallTfEffect)
effects.remat_allowed_effects.add_type(CallTfEffect)
effects.custom_derivatives_allowed_effects.add_type(CallTfEffect)


class CallTfOrderedEffect(effects.Effect):
  __str__ = lambda _: "CallTfOrderedEffect"


call_tf_ordered_effect = CallTfOrderedEffect()

effects.lowerable_effects.add_type(CallTfOrderedEffect)
effects.control_flow_allowed_effects.add_type(CallTfOrderedEffect)
effects.remat_allowed_effects.add_type(CallTfOrderedEffect)
effects.custom_derivatives_allowed_effects.add_type(CallTfOrderedEffect)
effects.ordered_effects.add_type(CallTfOrderedEffect)
effects.shardable_ordered_effects.add_type(CallTfOrderedEffect)


def _call_tf_abstract_eval(
    *args_flat_avals,
    function_flat_tf,
    args_flat_sig_tf,
    has_side_effects,
    ordered,
    output_avals,
    call_tf_graph,
    **__,
):
  # Called only when we form a Jaxpr, i.e., under jit, scan, etc.
  effects = set()
  if ordered:
    effects.add(call_tf_ordered_effect)
  elif has_side_effects:
    effects.add(call_tf_effect)

  # If no output_avals is given, then we ask TF to infer the output shapes.
  # We call this even if output_avals is given because it will ensure that
  # callable_flat_tf is called. Since _get_concrete_function_tf is cached
  # there is a small cost of calling it more often than needed.
  concrete_function_flat_tf = _get_concrete_function_tf(function_flat_tf,
                                                        args_flat_sig_tf)

  # In the case that the tf.function has no return value
  if len(concrete_function_flat_tf.outputs) == 0:
    return (), effects

  if output_avals is not None:
    return output_avals, effects

  def is_fully_known_shape(s):
    return s.rank is not None and all(d is not None for d in s)

  if all(is_fully_known_shape(s)
        for s in concrete_function_flat_tf.output_shapes):
    avals_from_tf = tuple(
        # We convert to JAX type, and canonicalize to 32-bit if necessary
        core.ShapedArray(shape, jax2tf_internal._to_jax_dtype(dtype))
        for dtype, shape in zip(concrete_function_flat_tf.output_dtypes,
                                concrete_function_flat_tf.output_shapes))
    return avals_from_tf, effects

  msg = ("call_tf cannot call functions whose output has dynamic shape. "
    f"Found output shapes: {concrete_function_flat_tf.output_shapes}. "
    "Consider using the `output_shape_dtype` argument to call_tf. "
    "\nSee https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf"
      " for a discussion.")
  raise ValueError(msg)


call_tf_p.def_effectful_abstract_eval(_call_tf_abstract_eval)


def _call_tf_lowering(
    ctx: mlir.LoweringRuleContext,
    *args_op,
    platform,
    function_flat_tf,
    args_flat_sig_tf,
    has_side_effects,
    ordered,
    call_tf_graph,
    output_avals,
    **_,
):
  # We use the same TF lowering device as for the embedding JAX computation.
  # One example when this is needed is when the code refers to variables on one
  # device. Or, for sharding annotations (only supported on TPU).

  if platform in ["cpu", "tpu"]:
    tf_platform = platform.upper()
  elif platform == "cuda":
    tf_platform = "GPU"
  else:
    raise ValueError("platform {platform} not supported")

  concrete_function_flat_tf = _get_concrete_function_tf(function_flat_tf, args_flat_sig_tf)

  captured_inputs = []
  if concrete_function_flat_tf.captured_inputs:
    # The function uses either captured variables or tensors.
    msg = (
        "call_tf works best with a TensorFlow function that does not capture "
        "variables or tensors from the context. "
        "See https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf for a discussion. "
        f"The following captures were found {concrete_function_flat_tf.captured_inputs}")
    logging.warning(msg)
    for inp in concrete_function_flat_tf.captured_inputs:
      if inp.dtype == tf.resource:  # A variable; lookup by handle
        inp_vars = [v for v in concrete_function_flat_tf.variables if inp is v.handle]
        assert len(inp_vars) == 1, f"Found {inp_vars}"
        captured_inputs.append(inp_vars[0])
      else:
        captured_inputs.append(inp)

  # The following use case happens when we call_tf a restored saved model that
  # includes parameters (hence functions closing over tf.Variable), and then
  # we jax2tf.convert it with native serialization, under tf.function (or
  # for saving to saved model). The `np.asarray(inp)` fails because it thinks
  # it is in TF graph mode. The `tf.init_scope()` lifts out of function-building
  # graph scopes, and allows us to read the values of the variables
  with tf.init_scope():
    captured_ops = tuple(
        mlir.ir_constant(np.asarray(inp))
        for inp in captured_inputs
    )

  if call_tf_graph:
    with jax2tf_internal.inside_call_tf():
      return emit_tf_embedded_graph_custom_call(
          ctx,
          concrete_function_flat_tf,
          tuple(args_op) + captured_ops,
          has_side_effects,
          ordered,
          output_avals,
      )

  def convert_to_spec(x):
    if isinstance(x, tf.TensorSpec):
      return x
    else:
      return tf.TensorSpec.from_tensor(x)

  args_tf_flat = [convert_to_spec(a) for a in args_flat_sig_tf]

  with jax2tf_internal.inside_call_tf():
    try:
      func_tf_hlo = function_flat_tf.experimental_get_compiler_ir(
          *args_tf_flat
      )(stage="hlo_serialized", platform_name=tf_platform)
    except Exception as e:
      msg = ("Error compiling TensorFlow function (see below for the caught exception)." +
             "\ncall_tf can used " +
              "in a staged context (under jax.jit, lax.scan, etc.) only with " +
              "compilable functions with static output shapes.\n" +
              "See https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf for a discussion." +
             "\n\nCaught TensorFlow exception: " + str(e))
      raise ValueError(msg) from e

  xla_comp = xla_client.XlaComputation(func_tf_hlo)

  # Canonicalize the results; e.g., makes them x32 if JAX is in 32-bit mode
  def canonical_res_aval(res_shape: xla_client.Shape) -> core.ShapedArray:
    if not res_shape.is_static():
      msg = ("Compiled TensorFlow function has dynamic output shape " +
             f"{res_shape}. call_tf can used " +
             "in a staged context (under jax.jit, lax.scan, etc.) only with " +
             "compilable functions with static output shapes. " +
             "See https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf for a discussion.")
      raise ValueError(msg)

    res_dtype = res_shape.numpy_dtype()
    jax_res_dtype = dtypes.canonicalize_dtype(res_dtype)
    return core.ShapedArray(res_shape.dimensions(), jax_res_dtype)

  result_shape = xla_comp.program_shape().result_shape()
  if not result_shape.is_tuple():
    # TF does not wrap singletons as tuples, but JAX expects tuples because
    # call_tf is a multiple_results primitive.
    result_shapes = (result_shape,)
  else:
    result_shapes = result_shape.tuple_shapes()  # type: ignore

  result_avals = tuple(map(canonical_res_aval, result_shapes))

  submodule = mlir.xla_computation_to_mlir_module(xla_comp)
  symtab = ir.SymbolTable(submodule.operation)
  callee_result_types = symtab["main"].type.results
  fn = mlir.merge_mlir_modules(ctx.module_context.module,
                               f"call_tf_{function_flat_tf.name}",
                               submodule,
                               dst_symtab=ctx.module_context.symbol_table)
  call = func_dialect.CallOp(callee_result_types,
                             ir.FlatSymbolRefAttr.get(fn),
                             tuple(args_op) + captured_ops)
  flat_results = call.results

  if ordered:
    raise NotImplementedError(
        "ordered=True is not supported in the jitted context without"
        " `call_tf_graph=True`"
    )

  outputs = []
  for op, res_aval, res_shape in zip(flat_results, result_avals,
                                     result_shapes):
    if res_aval.dtype != res_shape.numpy_dtype():
      op = hlo.ConvertOp(mlir.aval_to_ir_type(res_aval), op).result
    outputs.append(op)
  return outputs


def _register_call_lowering(platform):
  mlir.register_lowering(call_tf_p, functools.partial(_call_tf_lowering,
                                                      platform=platform),
                         platform=platform)
for platform in ("cpu", "cuda", "tpu"):
  _register_call_lowering(platform)

# Support the call_tf under jax2tf.convert in eager mode
def _jax2tf_call_tf(*args: TfVal,
                    callable_flat_tf: Callable,
                    **_) -> TfVal:
  with jax2tf_internal.inside_call_tf():
    res_tf_flat = callable_flat_tf(*args)
  return res_tf_flat

jax2tf_internal.tf_impl[call_tf_p] = _jax2tf_call_tf


def emit_tf_embedded_graph_custom_call(
    ctx: mlir.LoweringRuleContext,
    concrete_function_flat_tf,
    operands: Sequence[ir.Value],
    has_side_effects,
    ordered,
    output_avals,
):
  """Emits a custom call referencing a tf.Graph embedding of the TF function.

  All call_tf called function information is stored in tf.metadata.
  This includes:
  (1) The called function name: This name will be used by the runtime to execute
  the callback.
  (2) The called function index in the XLACallModule `function_list` attribute.
  """
  call_tf_concrete_function_list = jax2tf_internal.get_thread_local_state_call_tf_concrete_function_list()
  if call_tf_concrete_function_list is None:
    raise ValueError(
        "call_tf_graph=True only support exporting by jax2tf.convert currently."
    )
  # TODO(necula): It is dangerous to modify global state when lowering because
  # there are a number of lowering caches that only cache the StableHLO.
  # See call_tf_test.py:test_multi_platform_call_tf_graph.
  called_index = add_to_call_tf_concrete_function_list(
      concrete_function_flat_tf, call_tf_concrete_function_list)
  tf_backend_config = {
      "has_token_input_output": ir.BoolAttr.get(ordered),
      "called_index": mlir.i64_attr(called_index),
  }
  result_avals = ctx.avals_out if ctx.avals_out is not None else ()

  operands = list(operands)
  result_types = list(
      mlir.flatten_ir_types([mlir.aval_to_ir_type(aval) for aval in result_avals])
  )
  if ordered:
    operands.insert(0, ctx.tokens_in.get(call_tf_ordered_effect))
    result_types.insert(0, mlir.token_type())

  custom_call = hlo.CustomCallOp(
      result_types,
      operands,
      call_target_name=ir.StringAttr.get("tf.call_tf_function"),
      has_side_effect=ir.BoolAttr.get(has_side_effects),
      api_version=mlir.i32_attr(2),
      called_computations=ir.ArrayAttr.get([]),
      backend_config=ir.StringAttr.get(""),
  )
  # Store TF metadata in unregistered attribute
  custom_call.attributes["tf.backend_config"] = ir.DictAttr.get(
      tf_backend_config
  )

  results = list(custom_call.results)
  if ordered:
    token = results.pop(0)
    ctx.set_tokens_out(mlir.TokenSet({call_tf_ordered_effect: token}))

  return results


def add_to_call_tf_concrete_function_list(concrete_tf_fn: Any, call_tf_concrete_function_list: list[Any]) -> int:
  try:
    called_index = call_tf_concrete_function_list.index(concrete_tf_fn)
  except ValueError:
    called_index = len(call_tf_concrete_function_list)
    call_tf_concrete_function_list.append(concrete_tf_fn)
  return called_index
-												Change JAX's copyright attribution from "Google LLC" to "The JAX Authors.".

See https://opensource.google/documentation/reference/releasing/contributions#copyright for more details.

PiperOrigin-RevId: 476167538

											
										
										
											2022-09-22 12:26:48 -07:00
+								# Copyright 2021 The JAX Authors.
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								#
 								# Licensed under the Apache License, Version 2.0 (the "License");
 								# you may not use this file except in compliance with the License.
 								# You may obtain a copy of the License at
 								#
 								#     https://www.apache.org/licenses/LICENSE-2.0
 								#
 								# Unless required by applicable law or agreed to in writing, software
 								# distributed under the License is distributed on an "AS IS" BASIS,
 								# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 								# See the License for the specific language governing permissions and
 								# limitations under the License.
 								"""Allows JAX to call TensorFlow functions with support for autodiff.
 								**Experimental: please give feedback, and expect changes.**
 								This module introduces the function :func:`call_tf` that allows JAX to call
 								TensorFlow functions.
 								For examples and details, see
-												Update references to the GitHub url in JAX codebase to reflect move from google/jax to jax-ml/jax

PiperOrigin-RevId: 676843138

											
										
										
											2024-09-20 07:51:48 -07:00
+								https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#calling-tensorflow-functions-from-jax.
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
 								"""
-												Upgrade remaining sources to Python 3.9

This PR is a follow up to #18881.

The changes were generated by adding

    from __future__ import annotations

to the files which did not already have them and running

    pyupgrade --py39-plus --keep-percent-format {jax,tests,jaxlib,examples,benchmarks}/**/*.py

											
										
										
											2023-12-11 13:59:29 +00:00
 								from __future__ import annotations
-												Run `pyupgrade --py310-plus`.

Also apply manual fixes to import sorting and unused imports.

											
										
										
											2024-06-26 14:44:52 -04:00
+								from collections.abc import Callable, Sequence
-												[export] Fix the serialization of effects

We currently support only the serialization of effects with
nullary constructors. We must also ensure that upon deserialization
we produce an event that tests equal to the original one.
Here we add explicit error checks and tests.

We also make the CallTfEffect to have this property.

											
										
										
											2023-12-13 15:43:12 +01:00
+								import dataclasses
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								import functools
-												Run `pyupgrade --py310-plus`.

Also apply manual fixes to import sorting and unused imports.

											
										
										
											2024-06-26 14:44:52 -04:00
+								from typing import Any
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								from absl import logging
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								import jax
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								from jax import dlpack
-												[call_tf] Fixed the handling of x64 values in JAX_ENABLE_X64=False

TensorFlow interprets Python scalars in x64 mode, or it may contain
explicit x64 computation. When used with call_tf, we canonicalize
inputs and outputs using the JAX rules.

											
										
										
											2021-06-16 13:25:56 +03:00
+								from jax import dtypes
-												Fix the simple bug on call_tf.replace_non_float and add unittest for floating and complex data type.

PiperOrigin-RevId: 510055139

											
										
										
											2023-02-15 23:40:12 -08:00
+								from jax import numpy as jnp
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								from jax import tree_util
-												Refactor effects system to use effect types, not objects

											
										
										
											2023-02-01 17:50:00 -08:00
+								from jax._src import ad_util
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								from jax._src import core
-												Refactor effects system to use effect types, not objects

											
										
										
											2023-02-01 17:50:00 -08:00
+								from jax._src import effects
 								from jax._src import util
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								from jax._src.lib import xla_client
-												[MHLO] Switch call_tf to use an MHLO lowering (attempt 2).

In passing refactor and fix some bugs in the MHLO helper code:
* mlir.ir_constant() failed to propagate its canonicalize_types argument to its callee.
* Refactor the code to convert an XLA computation to an MHLO module and to merge two MHLO modules from the XLA fallback translation rule path.
* Fix symbol (alpha) renaming of call operator callees when merging MHLO modules.

Attempt 2: In this iteration of the merge_mhlo_modules function, move all the operators into the target module first before doing any symbol table manipulation.

PiperOrigin-RevId: 442904129

											
										
										
											2022-04-19 13:59:28 -07:00
+								from jax._src.lib.mlir import ir
 								from jax._src.lib.mlir.dialects import func as func_dialect
-												(NFC) Prepare for migration from producing MHLO to producing StableHLO

This CL renames occurrences of "mhlo" in: 1) names, 2) tests, 3) prose in order
to prepare for the upcoming migration.

Unchanged occurrences:
  1) Public API that contains "mhlo", e.g. XlaLowering.mhlo and the "mhlo"
     argument value in Lowering.as_text and Lowering.compiler_ir.
  2) Documentation (changelog, JEPs, IR examples, etc).
  3) One rare situation where prose says "StableHLO" and "MHLO" in one sentence,
     so both are necessary to disambiguate.

PiperOrigin-RevId: 495771153

											
										
										
											2022-12-15 20:59:34 -08:00
+								from jax._src.lib.mlir.dialects import hlo
-												Use imports relative to the `jax` package consistently, rather than `.`-relative imports.

This is more consistent, since currently we use a mix of both styles. It may also help pytype yield more accurate types.

PiperOrigin-RevId: 412057514

											
										
										
											2021-11-24 07:47:48 -08:00
+								from jax.experimental.jax2tf import jax2tf as jax2tf_internal
-												Merge pull request #22263 from hawkinsp:tuples

PiperOrigin-RevId: 653267867

											
										
										
											2024-07-17 09:56:18 -07:00
+								from jax._src.interpreters import mlir
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								import numpy as np
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								import tensorflow as tf
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[call_tf] Fixed the handling of x64 values in JAX_ENABLE_X64=False

TensorFlow interprets Python scalars in x64 mode, or it may contain
explicit x64 computation. When used with call_tf, we canonicalize
inputs and outputs using the JAX rules.

											
										
										
											2021-06-16 13:25:56 +03:00
+								map = util.safe_map
 								zip = util.safe_zip
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								TfConcreteFunction = Any
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								TfVal = jax2tf_internal.TfVal
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								# The platforms for which to use DLPack to avoid copying (only works on GPU
-												Replace references to DeviceArray with Array.

A number of stale references are lurking in our documentation.

											
										
										
											2023-08-18 16:50:36 -04:00
+								# and CPU at the moment, and only for Array). For CPU we don't need
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								# DLPack, if we are careful.
 								_DLPACK_PLATFORMS = ("gpu",)
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												Improve the default value of `output_shape_dtype`.

PiperOrigin-RevId: 549988693

											
										
										
											2023-07-21 10:43:03 -07:00
+								class UnspecifiedOutputShapeDtype:
 								  pass
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
 								def call_tf(
 								    callable_tf: Callable,
 								    has_side_effects=True,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    ordered=False,
-												Improve the default value of `output_shape_dtype`.

PiperOrigin-RevId: 549988693

											
										
										
											2023-07-21 10:43:03 -07:00
+								    output_shape_dtype=UnspecifiedOutputShapeDtype(),
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								    call_tf_graph=False,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								) -> Callable:
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								  """Calls a TensorFlow function from JAX, with support for reverse autodiff.
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  The ``callable_tf`` will be called with TensorFlow-compatible arguments (
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								  numpy.ndarray, ``tf.Tensor`` or ``tf.Variable``) or pytrees thereof. The
 								  function must return the same type of results.
 								  If ``call_tf`` appears in a JAX staging context (:func:`jax.jit`,
-												Delete `xmap` and the `jax.experimental.maps` module. It's been 5 months since its deprecation (more than the standard 3 months deprecation period).

PiperOrigin-RevId: 655614395

											
										
										
											2024-07-24 10:23:29 -07:00
+								  or :func:`jax.pmap`, or a control-flow primitive) then
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  ``callable_tf`` will be compiled with ``tf.function(callable_tf,
 								  jit_compile=True)``
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								  and the resulting XLA computation will be embedded in JAX's XLA computation.
 								  If ``call_tf`` appears outside a JAX staging context, it will be called inline
 								  using TensorFlow eager mode.
 								  The ``call_tf`` supports JAX's reverse-mode autodiff, in which case the
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  ``callable_tf`` will be differentiated using ``tf.GradientTape``. This means
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								  that the gradient will be TensorFlow-accurate, e.g., will respect the
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  custom gradients that may be defined for the code in ``callable_tf``.
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
 								  For an example and more details see the
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  `README
-												Update references to the GitHub url in JAX codebase to reflect move from google/jax to jax-ml/jax

PiperOrigin-RevId: 676843138

											
										
										
											2024-09-20 07:51:48 -07:00
+								  <https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#calling-tensorflow-functions-from-jax>`_.
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
 								  Args:
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    callable_tf: a TensorFlow Callable that can take a pytree of TensorFlow
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								      arguments.
-												[call_tf] Add has_side_effects parameter

The CallTfEffect was added recently as an internal workaround for
DCE removing instances of call_tf. Here we add a parameter to
`call_tf` to be able to declare if the called computation is
effectful and should not be removed by DCE.

											
										
										
											2023-01-12 08:44:53 +01:00
+								    has_side_effects: if True then it ensures that instances of this primitive
 								      are not removed or replicated by JAX optimizations such as dead-code
 								      elimination.
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    ordered: If true, calls are modeled as having ordered effects.
 								    output_shape_dtype: An optional declaration of the expected shape and dtype
 								      of the result of the called TensorFlow function. If given it will be used
 								      during JAX tracing to form the abstract values of the results of the
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								      `call_tf`. If not given then we form a `tf.Graph` for the called
 								      TensorFlow function and we use the TensorFlow-inferred shapes and types.
 								      Must be a pytree matching the structure of the nested structure returned
 								      from the TensorFlow function, containing objects with `.shape` and
 								      `.dtype` attributes, e.g., `jax.ShapeDtypeStruct` or `jax.Array`.
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								    call_tf_graph: EXPERIMENTAL, DO NOT USE. We may change the name in the
 								      future.
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								  Returns: a JAX callable that can be invoked with JAX pytree arguments, in
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    op-by-op mode or in a staged context. This callable can be used with JAX's
 								    reverse-mode autodiff (:func:`jax.grad`).
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								  """
 								  @jax.custom_vjp
 								  def make_call(*args_jax):
 								    """We wrap it all in `make_call` so that we can attach custom VJP."""
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    args_flat_jax, args_treedef = tree_util.tree_flatten(args_jax)
-												[call_tf] Fixed the handling of x64 values in JAX_ENABLE_X64=False

TensorFlow interprets Python scalars in x64 mode, or it may contain
explicit x64 computation. When used with call_tf, we canonicalize
inputs and outputs using the JAX rules.

											
										
										
											2021-06-16 13:25:56 +03:00
+								    # Canonicalize the arguments; e.g., makes them x32 if JAX is in 32-bit mode
 								    def canonical_arg(v):
 								      v = v if getattr(v, "dtype", None) else np.asarray(v)
 								      dtype = dtypes.canonicalize_dtype(v.dtype)
 								      if dtype != v.dtype:
 								        v = v.astype(dtype)
 								      return v
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    args_flat_jax = tuple(map(canonical_arg, args_flat_jax))
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								    def make_tensorspec(a_jax):
 								      a_tf_dtype = jax2tf_internal._to_tf_dtype(a_jax.dtype)
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								      a_tf_shape = [d if core.is_constant_dim(d) else None for d in a_jax.shape]
-												Allow call_tf to accept shape-polymorphic inputs if the output shapes are fully static.

PiperOrigin-RevId: 501645235

											
										
										
											2023-01-12 13:04:09 -08:00
+								      return tf.TensorSpec(a_tf_shape, a_tf_dtype)
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								    args_flat_sig_tf = tuple(map(make_tensorspec, args_flat_jax))
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
-												Improve the default value of `output_shape_dtype`.

PiperOrigin-RevId: 549988693

											
										
										
											2023-07-21 10:43:03 -07:00
+								    if not isinstance(output_shape_dtype, UnspecifiedOutputShapeDtype):
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								      output_shape_dtype_flat, output_shape_dtype_tree = tree_util.tree_flatten(output_shape_dtype)
 								      output_avals = tuple(core.ShapedArray(st.shape, st.dtype) for st in output_shape_dtype_flat)
 								    else:
 								      output_avals, output_shape_dtype_tree = None, None
-												[call_tf] Improve error reporting

Add more checks to catch early the cases when the called TF function
returns values that are not convertible to JAX values (arrays of
numeric values). All these cases were resulting in errors even before
but sometimes these errors were deep in the stack and harder to
diagnose.

											
										
										
											2022-08-04 09:50:41 +03:00
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    res_treedef = None  # We'll store here the result treedef
-												[call_tf] Improve error reporting

Add more checks to catch early the cases when the called TF function
returns values that are not convertible to JAX values (arrays of
numeric values). All these cases were resulting in errors even before
but sometimes these errors were deep in the stack and harder to
diagnose.

											
										
										
											2022-08-04 09:50:41 +03:00
+								    res_tf_flat = None  # For error reporting
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    # The function below will be called at least once, either in eager
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								    # mode during jax2tf_call_tf or in graph mode during _get_concrete_function_tf()
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    def callable_flat_tf(*args_tf_flat: TfVal) -> Sequence[TfVal]:
 								      args_tf = args_treedef.unflatten(args_tf_flat)
 								      res_tf = callable_tf(*args_tf)
-												Fix the problem for tf function return StatefulPartitionedCall during jax2tf.call_tf.

PiperOrigin-RevId: 529964653

											
										
										
											2023-05-06 08:29:45 -07:00
 								      # b/279454591: When `callable_tf` is a tf function with zero outputs, it
 								      # returns a `StatefulPartitionedCall` (if the function is stateful) or
 								      # `PartitionedCall` (if the function is stateless) op instead of
 								      # tf.Tensors. We work around this issue by replacing the output `res_tf`
 								      # with an empty list.
 								      if isinstance(res_tf, tf.Operation):
 								        assert (
 								            res_tf.type == "StatefulPartitionedCall"
 								            or res_tf.type == "PartitionedCall"
 								        )
 								        t_out = res_tf.get_attr("Tout")
 								        # t_out should be an empty list.
 								        assert not t_out, (
 								            "The TF function returned an unexpected result, please check its"
 								            f" function body. res_tf = {res_tf}"
 								        )
 								        res_tf = t_out
-												[call_tf] Improve error reporting

Add more checks to catch early the cases when the called TF function
returns values that are not convertible to JAX values (arrays of
numeric values). All these cases were resulting in errors even before
but sometimes these errors were deep in the stack and harder to
diagnose.

											
										
										
											2022-08-04 09:50:41 +03:00
+								      nonlocal res_treedef, res_tf_flat
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								      res_tf_flat, res_treedef_now = tree_util.tree_flatten(res_tf)
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								      assert res_treedef is None or res_treedef == res_treedef_now, (
 								          f"Subsequent calls had different results. Previous {res_treedef} and now {res_treedef_now}")
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								      res_treedef = res_treedef_now
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								      if output_avals is not None:
 								        if res_treedef != output_shape_dtype_tree:
 								          raise ValueError(
 								              "The pytree of the TensorFlow function results does not match the "
 								              "pytree of the declared output_shape_dtype:\n"
 								              f"results pytree: {res_treedef}\noutput_shape_dtype tree: {output_shape_dtype_tree}")
 								        assert len(output_avals) == len(res_tf_flat)
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								      checked_res_tf_flat = [
 								          check_tf_result(i, r_tf, r_aval)
 								          for i, (r_tf, r_aval) in enumerate(
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								              zip(res_tf_flat,
 								                  (output_avals
 								                   if output_avals is not None
 								                   else (None,) * len(res_tf_flat))))]
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								      return checked_res_tf_flat
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
 								    # Prepare a tf.function ahead of time, to cache the concrete functions. This
 								    # won't be used in op-by-op execution mode.
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								    function_flat_tf = tf.function(
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								        callable_flat_tf, autograph=False, jit_compile=not call_tf_graph)
-												[call_tf] Fixed the handling of x64 values in JAX_ENABLE_X64=False

TensorFlow interprets Python scalars in x64 mode, or it may contain
explicit x64 computation. When used with call_tf, we canonicalize
inputs and outputs using the JAX rules.

											
										
										
											2021-06-16 13:25:56 +03:00
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								    res_jax_flat = call_tf_p.bind(
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								        *args_flat_jax,
-												[jax2tf] Fix the round-trip call_tf(convert)

Also cleaned the handling of global state in jax2tf.

											
										
										
											2021-06-10 17:01:22 +02:00
+								        # Carry the actual function such that op-by-op call can call in TF eager mode.
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								        callable_flat_tf=callable_flat_tf,
 								        function_flat_tf=function_flat_tf,
-												[call_tf] Add has_side_effects parameter

The CallTfEffect was added recently as an internal workaround for
DCE removing instances of call_tf. Here we add a parameter to
`call_tf` to be able to declare if the called computation is
effectful and should not be removed by DCE.

											
										
										
											2023-01-12 08:44:53 +01:00
+								        args_flat_sig_tf=args_flat_sig_tf,
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								        output_avals=output_avals,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								        has_side_effects=has_side_effects,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								        ordered=ordered,
 								        call_tf_graph=call_tf_graph,
 								    )
-												[call_tf] Improve error reporting

Add more checks to catch early the cases when the called TF function
returns values that are not convertible to JAX values (arrays of
numeric values). All these cases were resulting in errors even before
but sometimes these errors were deep in the stack and harder to
diagnose.

											
										
										
											2022-08-04 09:50:41 +03:00
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								    # We must have called callable_flat_tf by nοw
-												[call_tf] Improve error reporting

Add more checks to catch early the cases when the called TF function
returns values that are not convertible to JAX values (arrays of
numeric values). All these cases were resulting in errors even before
but sometimes these errors were deep in the stack and harder to
diagnose.

											
										
										
											2022-08-04 09:50:41 +03:00
+								    assert res_treedef is not None
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								    return res_treedef.unflatten(res_jax_flat)
 								  # Define the fwd and bwd custom_vjp functions
 								  def make_call_vjp_fwd(*args_jax):
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								    # Return the primal arguments as the residual
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								    return make_call(*args_jax), args_jax
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								  def make_call_vjp_bwd(residual_jax, ct_res_jax):
 								    args_jax = residual_jax  # residual is the primal argument
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								    def tf_vjp_fun(args_tf, ct_res_tf):
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								      """Invoke TF gradient."""
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
-												Support `None` leaves in arguments to gradient of a call_tf wrapped function.

PiperOrigin-RevId: 662115139

											
										
										
											2024-08-12 09:23:40 -07:00
+								      # TF does not like us to watch non-float vars or Nones.
 								      def replace_non_float_or_none(arg_tf):
 								        if arg_tf is not None and (
 								            arg_tf.dtype.is_floating or arg_tf.dtype.is_complex
 								        ):
-												Fix the simple bug on call_tf.replace_non_float and add unittest for floating and complex data type.

PiperOrigin-RevId: 510055139

											
										
										
											2023-02-15 23:40:12 -08:00
+								          return arg_tf
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								        else:
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								          # When watched, this will be ignored. When used in results it will
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								          # result in a floating 0. gradient, which JAX will ignore (and
 								          # replace it with a float0)
 								          return tf.zeros((), dtype=tf.float32)
-												Support `None` leaves in arguments to gradient of a call_tf wrapped function.

PiperOrigin-RevId: 662115139

											
										
										
											2024-08-12 09:23:40 -07:00
+								      watched_args_tf = tf.nest.map_structure(
 								          replace_non_float_or_none, args_tf
 								      )
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								      with tf.GradientTape(persistent=True) as tape:
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								        tape.watch(watched_args_tf)
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								        res = callable_tf(*args_tf)
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
 								      tf.nest.assert_same_structure(res, ct_res_tf)
 								      dres_darg = tape.gradient(
-												Support `None` leaves in arguments to gradient of a call_tf wrapped function.

PiperOrigin-RevId: 662115139

											
										
										
											2024-08-12 09:23:40 -07:00
+								          tf.nest.map_structure(replace_non_float_or_none, res),
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								          sources=watched_args_tf,
 								          output_gradients=ct_res_tf,
-												Support `None` leaves in arguments to gradient of a call_tf wrapped function.

PiperOrigin-RevId: 662115139

											
										
										
											2024-08-12 09:23:40 -07:00
+								          unconnected_gradients=tf.UnconnectedGradients.ZERO,
 								      )
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
-												Add tf.convert_to_tensor for call_tf gradient outputs.

PiperOrigin-RevId: 510453014

											
										
										
											2023-02-17 09:38:41 -08:00
+								      dres_darg = tree_util.tree_map(
 								          lambda x: x if x is None else tf.convert_to_tensor(x),
 								          dres_darg,
 								      )
-												Relaxed the assertion for is_same_structure in `jax2tf.call_tf` so that `tf_fun` may mutate the structure of its input parameters.

PiperOrigin-RevId: 665919824

											
										
										
											2024-08-21 09:48:59 -07:00
 								      # callable_tf may mutate (the structure of) args_tf, thus we check against
 								      # watched_args_tf which should be structurally the same as the original
 								      # args_tf.
 								      tf.nest.assert_same_structure(dres_darg, watched_args_tf)
-												[jax2tf] Fix the custom gradients for call_tf

The previous implementation did not work correctly when
the call_tf function was embedded in a larger JAX function
for which we take the gradient.

Also fixed handling of non-float args/results.

											
										
										
											2021-06-16 10:20:24 +03:00
+								      return dres_darg
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								    # Use call_tf to call the VJP function
-												[jax2tf] A few fixed for handling of float0 in jax2tf and call_tf

TF returns None or 0 for the gradients of functions with integer
arguments. JAX expects float0. We must convert to and from float0
at the JAX-TF boundary.

											
										
										
											2021-06-29 14:57:42 +03:00
+								    ct_args_jax = call_tf(tf_vjp_fun)(args_jax, ct_res_jax)
 								    # We must make the float0s that JAX expects
 								    def fix_float0(arg_jax, ct_arg_jax):
-												Update users of jax.tree.map() to be more careful about how they handle Nones.

Due to a bug in JAX, JAX previously permitted `jax.tree.map(f, None, x)` where `x` is not `None`, effectively treating `None` as if it were pytree-prefix of any value. But `None` is a pytree container, and it is only a prefix of `None` itself.

Fix code that was relying on this bug. Most commonly, the fix is to write
`jax.tree.map(lambda a, b: (None if a is None else f(a, b)), x, y, is_leaf=lambda t: t is None)`.

PiperOrigin-RevId: 673258116

											
										
										
											2024-09-10 23:53:24 -07:00
+								      if arg_jax is None:
 								        return None
-												[jax2tf] A few fixed for handling of float0 in jax2tf and call_tf

TF returns None or 0 for the gradients of functions with integer
arguments. JAX expects float0. We must convert to and from float0
at the JAX-TF boundary.

											
										
										
											2021-06-29 14:57:42 +03:00
+								      arg_dtype = dtypes.result_type(arg_jax)  # May be scalar
 								      ct_arg_dtype = core.primal_dtype_to_tangent_dtype(arg_dtype)
 								      if ct_arg_dtype != ct_arg_jax.dtype:
 								        return ad_util.zeros_like_aval(core.ShapedArray(np.shape(arg_jax),
 								                                                        ct_arg_dtype))
 								      return ct_arg_jax
-												Update users of jax.tree.map() to be more careful about how they handle Nones.

Due to a bug in JAX, JAX previously permitted `jax.tree.map(f, None, x)` where `x` is not `None`, effectively treating `None` as if it were pytree-prefix of any value. But `None` is a pytree container, and it is only a prefix of `None` itself.

Fix code that was relying on this bug. Most commonly, the fix is to write
`jax.tree.map(lambda a, b: (None if a is None else f(a, b)), x, y, is_leaf=lambda t: t is None)`.

PiperOrigin-RevId: 673258116

											
										
										
											2024-09-10 23:53:24 -07:00
+								    ct_args_jax_fixed = tree_util.tree_map(fix_float0, args_jax, ct_args_jax,
 								                                           is_leaf=lambda x: x is None)
-												[jax2tf] A few fixed for handling of float0 in jax2tf and call_tf

TF returns None or 0 for the gradients of functions with integer
arguments. JAX expects float0. We must convert to and from float0
at the JAX-TF boundary.

											
										
										
											2021-06-29 14:57:42 +03:00
+								    return ct_args_jax_fixed
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
 								  make_call.defvjp(make_call_vjp_fwd, make_call_vjp_bwd)
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  return util.wraps(callable_tf)(make_call)
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												Upgrade remaining sources to Python 3.9

This PR is a follow up to #18881.

The changes were generated by adding

    from __future__ import annotations

to the files which did not already have them and running

    pyupgrade --py39-plus --keep-percent-format {jax,tests,jaxlib,examples,benchmarks}/**/*.py

											
										
										
											2023-12-11 13:59:29 +00:00
+								def check_tf_result(idx: int, r_tf: TfVal, r_aval: core.ShapedArray | None) -> TfVal:
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								  # Check that the TF function returns values of expected types. This
 								  # improves error reporting, preventing hard-to-diagnose errors downstream
 								  try:
 								    jax2tf_internal._tfval_to_tensor_jax_dtype(r_tf)
 								  except Exception as e:
 								    msg = ("The called TF function returns a result that is not "
 								           f"convertible to JAX: {r_tf}.")
 								    raise ValueError(msg) from e
 								  if r_aval is None:
 								    return r_tf
 								  # We convert to TF type, and canonicalize to 32-bit if necessary
 								  r_aval_dtype_tf = jax2tf_internal._to_tf_dtype(r_aval.dtype)
 								  # Checking shapes is trickier in presence of dynamic shapes. I wish we could
 								  # check at runtime that the returned shape matches the declared shape. I wish
 								  # that tf.ensure_shape did this, but it can only take shapes that contain None
 								  # not computed shapes. However, in eager mode we should be able to resolve
 								  # the declared shapes to constants and we get better checking.
 								  if tf.executing_eagerly():
 								    r_aval_shape_tf = jax2tf_internal._eval_shape(r_aval.shape)
 								  else:
 								    r_aval_shape_tf = jax2tf_internal._aval_to_tf_shape(r_aval)
 								  # We do as much checking as we can here, instead of relying on tf.ensure_shape
 								  # because the latter gives different errors in eager vs. compiled mode.
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								  # TODO(b/279454591): This strange error is from TF. Eager function suppose
 								  # return tf Val with concrete shape but not.  Here we change exception to warn
 								  # and bypass it. This case need revisit on TF side.
 								  try:
 								    _ = len(r_tf.shape)
 								  except ValueError as e:
 								    msg = (
 								        "The shape check test cannot be performed because the shape of the"
 								        "`r_tf` tensor cannot be obtained."
 								        f"r_tf = {r_tf}, r_aval = {r_aval}"
 								    )
 								    msg += str(e)
 								    logging.warning(msg)
 								    return r_tf
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								  if (r_tf.dtype != r_aval_dtype_tf or
 								      len(r_tf.shape) != len(r_aval_shape_tf) or
 								      any(r_aval_d is not None and r_tf_d is not None and r_aval_d != r_tf_d
 								          for r_tf_d, r_aval_d in zip(r_tf.shape, r_aval_shape_tf))):
 								    msg = ("The shapes or dtypes returned by the TensorFlow function "
 								           "do not match the declared output_shape_dtype:\n"
 								           f"Result[{idx}] is {r_tf.dtype}[{r_tf.shape}] vs. expected {r_aval_dtype_tf}[{r_aval_shape_tf}]")
 								    raise ValueError(msg)
 								  # At this point tf.ensure_shape does not do much, it should never throw an
 								  # error, albeit it may refine the shape a bit.
 								  return tf.ensure_shape(r_tf, r_aval_shape_tf)
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								call_tf_p = core.Primitive("call_tf")
 								call_tf_p.multiple_results = True
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								# The impl will be used in op-by-op mode and calls callable_tf in TF eager mode.
 								def _call_tf_impl(*args_jax_flat, callable_flat_tf, **_):
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								  # On GPU we use dlpack to avoid copies of data to the host.
 								  def _arg_jax_to_tf(arg_jax):
-												[JAX] Replace uses of jax.interpreters.xla.DeviceArray with jax.Array.

PiperOrigin-RevId: 508822404

											
										
										
											2023-02-10 20:56:02 -08:00
+								    if (isinstance(arg_jax, jax.Array) and
-												Make the device check works when the number of devices is larger than one.

PiperOrigin-RevId: 538760855

											
										
										
											2023-06-08 05:51:00 -07:00
+								        list(arg_jax.devices())[0].platform in _DLPACK_PLATFORMS and
-												Fix unnecessary memory copies between GPU and CPU when `jax2tf.call_tf()` is used.

- The root cause of the bug is that dtype lookups are incorrect because hashes behave differently between dtype instances and their types. Added comments to `jax.dlpack.SUPPORTED_DTYPES` about this.
- Added unit test coverage.
- Fixing this bug revealed a limitation of causing "host-to-device" copy in the following two situations. See the details in the unit test comments.:
  - When the dtype is 'int32'.
  - When using PJRT C API runtime.

PiperOrigin-RevId: 610799558

											
										
										
											2024-02-27 10:35:03 -08:00
+								        arg_jax.dtype.type in dlpack.SUPPORTED_DTYPES):
-												Add support for max_version, dl_device, copy kwargs in __dlpack__

											
										
										
											2024-04-11 16:44:19 +00:00
+								      arg_dlpack = jax.dlpack.to_dlpack(arg_jax)
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								      return tf.experimental.dlpack.from_dlpack(arg_dlpack)
-												Replace references to DeviceArray with Array.

A number of stale references are lurking in our documentation.

											
										
										
											2023-08-18 16:50:36 -04:00
+								    # The following avoids copies to the host on CPU, always for Array
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								    # and even for ndarray if they are sufficiently aligned.
 								    # TODO(necula): on TPU this copies to the host!
-												revise logic for tangent types of extended dtypes

* remove the dead code KeyTangentTy
* replace TyRules.make_tangent with TyRules.zero
* removed ad.instantiate_zeros_aval, which was redundant with ad.instantiate_zeros ever since (1) we removed units and (2) we made Zero carry an aval on it
* fix a bug in backward_pass where we instantiated a Zero at the primal type rather than the corresponding tangent type
* fix _f_bwd in test_keyarray_custom_vjp, which had the wrong type (need to return cotangents for all inputs, we were returning a (float_tangent, key_tangent) pair instead of a (float_tangent, (float_tangent, key_tangent)) nested tuple, see #19009 for a check which catches this and hence includes the same test change

We probably also need a TyRules.add for any extended dtypes that can occur as tangent dtypes, but we currently don't have any tests that exercise that (because all extended dtype tangent types are currently float0). I have some follow-up work to add such a case though!

											
										
										
											2023-12-20 12:47:43 -08:00
+								    if getattr(arg_jax, 'dtype', None) == dtypes.float0:
 								      return tf.zeros(shape=arg_jax.shape,
 								                      dtype=jax2tf_internal._tf_np_dtype_for_float0)
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								    return tf.constant(np.asarray(arg_jax))
 								  args_tf_flat = tuple(map(_arg_jax_to_tf, args_jax_flat))
-												[jax2tf] Fix the round-trip call_tf(convert)

Also cleaned the handling of global state in jax2tf.

											
										
										
											2021-06-10 17:01:22 +02:00
+								  with jax2tf_internal.inside_call_tf():
 								    # Call in TF eager mode
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    res_tf_flat = callable_flat_tf(*args_tf_flat)
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  def _res_tf_to_jax(res_tf: TfVal):
-												Fix unnecessary memory copies between GPU and CPU when `jax2tf.call_tf()` is used.

- The root cause of the bug is that dtype lookups are incorrect because hashes behave differently between dtype instances and their types. Added comments to `jax.dlpack.SUPPORTED_DTYPES` about this.
- Added unit test coverage.
- Fixing this bug revealed a limitation of causing "host-to-device" copy in the following two situations. See the details in the unit test comments.:
  - When the dtype is 'int32'.
  - When using PJRT C API runtime.

PiperOrigin-RevId: 610799558

											
										
										
											2024-02-27 10:35:03 -08:00
+								    res_tf, jax_dtype = jax2tf_internal._tfval_to_tensor_jax_dtype(res_tf)
 								    if isinstance(res_tf, tf.Tensor) and jax_dtype.type in dlpack.SUPPORTED_DTYPES:
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								      res_tf_platform = tf.DeviceSpec.from_string(res_tf.backing_device).device_type
 								      res_jax_platform = res_tf_platform.lower()
-												[PJRT C API] Enable PJRT C API runtime in jax2tf dlpack.

GetDefaultLayout added a fallback for GPU backend so it is no longer blocked by the fact that PJRT C API does not support GetDefaultLayout yet.

PiperOrigin-RevId: 632555239

											
										
										
											2024-05-10 11:29:49 -07:00
+								      if res_jax_platform in _DLPACK_PLATFORMS:
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
+								        res_dlpack = tf.experimental.dlpack.to_dlpack(res_tf)
-												[JAX] Improve support for DLPack tensors on CPU when a GPU is available.

https://github.com/google/jax/issues/5581

Previously the user had to provide the target backend explicitly. Now we supply both CPU and GPU backends to the C++ code so it can choose based on the metadata of the DLPack tensor.

PiperOrigin-RevId: 380795192

											
										
										
											2021-06-22 06:38:22 -07:00
+								        return jax.dlpack.from_dlpack(res_dlpack)
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
-												Fix the simple bug on call_tf.replace_non_float and add unittest for floating and complex data type.

PiperOrigin-RevId: 510055139

											
										
										
											2023-02-15 23:40:12 -08:00
+								    # When working with a bfloat16 scalar tf.Tensor,np.asarray() can fail.
 								    # To handle this special case, we create a numpy copy.
 								    if res_tf.shape == tf.TensorShape([]) and res_tf.dtype == tf.bfloat16:
 								      return jax.device_put(jnp.array(res_tf.numpy()))
 								    else:
 								      return jax.device_put(np.asarray(res_tf))
-												[call_tf] Add support for DLPack to avoid copying arrays in eager mode

											
										
										
											2021-02-05 12:04:25 +02:00
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  return list(map(_res_tf_to_jax, res_tf_flat))
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
 								call_tf_p.def_impl(_call_tf_impl)
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								@functools.lru_cache(maxsize=128)
 								def _get_concrete_function_tf(function_flat_tf, args_flat_sig_tf):  # -> tf.ConcreteFunction
 								  with jax2tf_internal.inside_call_tf():
 								    return function_flat_tf.get_concrete_function(*args_flat_sig_tf)
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												Refactor effects system to use effect types, not objects

											
										
										
											2023-02-01 17:50:00 -08:00
+								# Mark the effectful instances of call_tf
-												[export] Fix the serialization of effects

We currently support only the serialization of effects with
nullary constructors. We must also ensure that upon deserialization
we produce an event that tests equal to the original one.
Here we add explicit error checks and tests.

We also make the CallTfEffect to have this property.

											
										
										
											2023-12-13 15:43:12 +01:00
+								@dataclasses.dataclass(frozen=True)
-												Refactor effects system to use effect types, not objects

											
										
										
											2023-02-01 17:50:00 -08:00
+								class CallTfEffect(effects.Effect):
 								  __str__ = lambda _: "CallTfEffect"
 								call_tf_effect = CallTfEffect()
-												Make `call_tf`'s abstract eval rule effectful so that JAX's DCE pass doesn't prune the arguments passed to it.

PiperOrigin-RevId: 496022997

											
										
										
											2022-12-16 20:42:19 -08:00
-												Refactor effects system to use effect types, not objects

											
										
										
											2023-02-01 17:50:00 -08:00
+								effects.lowerable_effects.add_type(CallTfEffect)
 								effects.control_flow_allowed_effects.add_type(CallTfEffect)
 								effects.remat_allowed_effects.add_type(CallTfEffect)
 								effects.custom_derivatives_allowed_effects.add_type(CallTfEffect)
-												Make `call_tf`'s abstract eval rule effectful so that JAX's DCE pass doesn't prune the arguments passed to it.

PiperOrigin-RevId: 496022997

											
										
										
											2022-12-16 20:42:19 -08:00
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								class CallTfOrderedEffect(effects.Effect):
 								  __str__ = lambda _: "CallTfOrderedEffect"
 								call_tf_ordered_effect = CallTfOrderedEffect()
 								effects.lowerable_effects.add_type(CallTfOrderedEffect)
 								effects.control_flow_allowed_effects.add_type(CallTfOrderedEffect)
 								effects.remat_allowed_effects.add_type(CallTfOrderedEffect)
 								effects.custom_derivatives_allowed_effects.add_type(CallTfOrderedEffect)
 								effects.ordered_effects.add_type(CallTfOrderedEffect)
-												Add support for shardable ordered effects to `jax2tf.call_tf`

PiperOrigin-RevId: 566361705

											
										
										
											2023-09-18 11:23:49 -07:00
+								effects.shardable_ordered_effects.add_type(CallTfOrderedEffect)
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								def _call_tf_abstract_eval(
 								    *args_flat_avals,
 								    function_flat_tf,
 								    args_flat_sig_tf,
 								    has_side_effects,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    ordered,
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								    output_avals,
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								    call_tf_graph,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    **__,
 								):
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								  # Called only when we form a Jaxpr, i.e., under jit, scan, etc.
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								  effects = set()
 								  if ordered:
 								    effects.add(call_tf_ordered_effect)
 								  elif has_side_effects:
 								    effects.add(call_tf_effect)
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								  # If no output_avals is given, then we ask TF to infer the output shapes.
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								  # We call this even if output_avals is given because it will ensure that
 								  # callable_flat_tf is called. Since _get_concrete_function_tf is cached
 								  # there is a small cost of calling it more often than needed.
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								  concrete_function_flat_tf = _get_concrete_function_tf(function_flat_tf,
 								                                                        args_flat_sig_tf)
-												Consolidate the code path for both `call_tf_graph=True` or `call_tf_graph=False`.

PiperOrigin-RevId: 552605585

											
										
										
											2023-07-31 15:17:48 -07:00
 								  # In the case that the tf.function has no return value
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
+								  if len(concrete_function_flat_tf.outputs) == 0:
-												ENH Use {} and () instead of dict() and tuple()

											
										
										
											2023-09-22 09:05:42 +01:00
+								    return (), effects
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								  if output_avals is not None:
 								    return output_avals, effects
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								  def is_fully_known_shape(s):
-												MAINT Use a generator expression with `all()` and `any()`

There is no reason to allocate a list only for the purpose of iteration.

											
										
										
											2023-10-10 22:33:03 +01:00
+								    return s.rank is not None and all(d is not None for d in s)
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
 								  if all(is_fully_known_shape(s)
 								        for s in concrete_function_flat_tf.output_shapes):
 								    avals_from_tf = tuple(
 								        # We convert to JAX type, and canonicalize to 32-bit if necessary
 								        core.ShapedArray(shape, jax2tf_internal._to_jax_dtype(dtype))
 								        for dtype, shape in zip(concrete_function_flat_tf.output_dtypes,
 								                                concrete_function_flat_tf.output_shapes))
 								    return avals_from_tf, effects
 								  msg = ("call_tf cannot call functions whose output has dynamic shape. "
 								    f"Found output shapes: {concrete_function_flat_tf.output_shapes}. "
 								    "Consider using the `output_shape_dtype` argument to call_tf. "
-												Update references to the GitHub url in JAX codebase to reflect move from google/jax to jax-ml/jax

PiperOrigin-RevId: 676843138

											
										
										
											2024-09-20 07:51:48 -07:00
+								    "\nSee https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf"
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								      " for a discussion.")
 								  raise ValueError(msg)
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
-												Make `call_tf`'s abstract eval rule effectful so that JAX's DCE pass doesn't prune the arguments passed to it.

PiperOrigin-RevId: 496022997

											
										
										
											2022-12-16 20:42:19 -08:00
+								call_tf_p.def_effectful_abstract_eval(_call_tf_abstract_eval)
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								def _call_tf_lowering(
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								    ctx: mlir.LoweringRuleContext,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    *args_op,
 								    platform,
 								    function_flat_tf,
 								    args_flat_sig_tf,
 								    has_side_effects,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    ordered,
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								    call_tf_graph,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    output_avals,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    **_,
 								):
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								  # We use the same TF lowering device as for the embedding JAX computation.
 								  # One example when this is needed is when the code refers to variables on one
 								  # device. Or, for sharding annotations (only supported on TPU).
-												[2/n] Embed the tf.Graph into the stablehlo.custom_call.

PiperOrigin-RevId: 527302563

											
										
										
											2023-04-26 10:20:12 -07:00
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								  if platform in ["cpu", "tpu"]:
 								    tf_platform = platform.upper()
 								  elif platform == "cuda":
 								    tf_platform = "GPU"
 								  else:
 								    raise ValueError("platform {platform} not supported")
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								  concrete_function_flat_tf = _get_concrete_function_tf(function_flat_tf, args_flat_sig_tf)
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								  captured_inputs = []
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  if concrete_function_flat_tf.captured_inputs:
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								    # The function uses either captured variables or tensors.
 								    msg = (
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								        "call_tf works best with a TensorFlow function that does not capture "
 								        "variables or tensors from the context. "
-												Update references to the GitHub url in JAX codebase to reflect move from google/jax to jax-ml/jax

PiperOrigin-RevId: 676843138

											
										
										
											2024-09-20 07:51:48 -07:00
+								        "See https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf for a discussion. "
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								        f"The following captures were found {concrete_function_flat_tf.captured_inputs}")
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								    logging.warning(msg)
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    for inp in concrete_function_flat_tf.captured_inputs:
-												[call_tf] Fix bug when calling TF functions with variables in a jit context.

The code was assuming that the `.captured_inputs` of a function are
variables in the same order as `.variables`. This seems to not be
true. Lookup variables now by handle.

											
										
										
											2021-09-14 14:15:40 +02:00
+								      if inp.dtype == tf.resource:  # A variable; lookup by handle
 								        inp_vars = [v for v in concrete_function_flat_tf.variables if inp is v.handle]
 								        assert len(inp_vars) == 1, f"Found {inp_vars}"
 								        captured_inputs.append(inp_vars[0])
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
+								      else:
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								        captured_inputs.append(inp)
-												[call_tf] Fixed the handling of x64 values in JAX_ENABLE_X64=False

TensorFlow interprets Python scalars in x64 mode, or it may contain
explicit x64 computation. When used with call_tf, we canonicalize
inputs and outputs using the JAX rules.

											
										
										
											2021-06-16 13:25:56 +03:00
-												[jax2tf] Fixes a bad interaction between jax2tf.convert, TF, and call_tf.

Consider the use case when we call_tf a restored saved model that
includes parameters (hence functions closing over tf.Variable), and then
we jax2tf.convert it with native serialization, under tf.function (or
for saving to saved model).

The lowering for call_tf in presence of functions with captured inputs
requires looking up the tf.Variable and reading its value. This fails
with an error that `v.numpy()` is not allowd in graph mode. The fix
is to use `tf.init_scope()` to lift out of graph building mode, so that
we can read the value of the variables.

											
										
										
											2024-10-24 10:12:54 +02:00
+								  # The following use case happens when we call_tf a restored saved model that
 								  # includes parameters (hence functions closing over tf.Variable), and then
 								  # we jax2tf.convert it with native serialization, under tf.function (or
 								  # for saving to saved model). The `np.asarray(inp)` fails because it thinks
 								  # it is in TF graph mode. The `tf.init_scope()` lifts out of function-building
 								  # graph scopes, and allows us to read the values of the variables
 								  with tf.init_scope():
 								    captured_ops = tuple(
 								        mlir.ir_constant(np.asarray(inp))
 								        for inp in captured_inputs
 								    )
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								  if call_tf_graph:
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    with jax2tf_internal.inside_call_tf():
 								      return emit_tf_embedded_graph_custom_call(
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								          ctx,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								          concrete_function_flat_tf,
 								          tuple(args_op) + captured_ops,
 								          has_side_effects,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								          ordered,
 								          output_avals,
 								      )
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
-												Consolidate the experimental_get_compiler_ir eager and tf function path in jax2tf.call_tf.

PiperOrigin-RevId: 506424270

											
										
										
											2023-02-01 14:30:35 -08:00
+								  def convert_to_spec(x):
 								    if isinstance(x, tf.TensorSpec):
 								      return x
 								    else:
 								      return tf.TensorSpec.from_tensor(x)
-												Change args_tf_flat to tf.TensorSpec in jax2tf.call_tf.

PiperOrigin-RevId: 502492762

											
										
										
											2023-01-16 22:42:42 -08:00
-												Consolidate the experimental_get_compiler_ir eager and tf function path in jax2tf.call_tf.

PiperOrigin-RevId: 506424270

											
										
										
											2023-02-01 14:30:35 -08:00
+								  args_tf_flat = [convert_to_spec(a) for a in args_flat_sig_tf]
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								  with jax2tf_internal.inside_call_tf():
 								    try:
-												Used `platform_name` for `call_tf`.

PiperOrigin-RevId: 599200102

											
										
										
											2024-01-17 09:33:14 -08:00
+								      func_tf_hlo = function_flat_tf.experimental_get_compiler_ir(
 								          *args_tf_flat
 								      )(stage="hlo_serialized", platform_name=tf_platform)
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								    except Exception as e:
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								      msg = ("Error compiling TensorFlow function (see below for the caught exception)." +
 								             "\ncall_tf can used " +
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								              "in a staged context (under jax.jit, lax.scan, etc.) only with " +
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								              "compilable functions with static output shapes.\n" +
-												Update references to the GitHub url in JAX codebase to reflect move from google/jax to jax-ml/jax

PiperOrigin-RevId: 676843138

											
										
										
											2024-09-20 07:51:48 -07:00
+								              "See https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf for a discussion." +
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								             "\n\nCaught TensorFlow exception: " + str(e))
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								      raise ValueError(msg) from e
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								  xla_comp = xla_client.XlaComputation(func_tf_hlo)
 								  # Canonicalize the results; e.g., makes them x32 if JAX is in 32-bit mode
-												Remove more exported names from jax.interpreters.xla.

None of these appear to have public users, and this module is not included in the deprecation policy.

Also:
* shorten a number of alias chains.
* move make_op_metadata() into its only caller in jax2tf
* delete the unused function dtype_to_primitive_type.
PiperOrigin-RevId: 510205315

											
										
										
											2023-02-16 11:54:25 -08:00
+								  def canonical_res_aval(res_shape: xla_client.Shape) -> core.ShapedArray:
-												[jax2tf] Improved error checking for call_tf for functions with dynamic
shapes.

											
										
										
											2021-12-01 11:34:37 +02:00
+								    if not res_shape.is_static():
 								      msg = ("Compiled TensorFlow function has dynamic output shape " +
 								             f"{res_shape}. call_tf can used " +
 								             "in a staged context (under jax.jit, lax.scan, etc.) only with " +
-												Fix typo "compileable"->"compilable".

PiperOrigin-RevId: 517581258

											
										
										
											2023-03-17 21:50:26 -07:00
+								             "compilable functions with static output shapes. " +
-												Update references to the GitHub url in JAX codebase to reflect move from google/jax to jax-ml/jax

PiperOrigin-RevId: 676843138

											
										
										
											2024-09-20 07:51:48 -07:00
+								             "See https://github.com/jax-ml/jax/blob/main/jax/experimental/jax2tf/README.md#limitations-of-call_tf for a discussion.")
-												[jax2tf] Improved error checking for call_tf for functions with dynamic
shapes.

											
										
										
											2021-12-01 11:34:37 +02:00
+								      raise ValueError(msg)
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								    res_dtype = res_shape.numpy_dtype()
 								    jax_res_dtype = dtypes.canonicalize_dtype(res_dtype)
 								    return core.ShapedArray(res_shape.dimensions(), jax_res_dtype)
 								  result_shape = xla_comp.program_shape().result_shape()
 								  if not result_shape.is_tuple():
 								    # TF does not wrap singletons as tuples, but JAX expects tuples because
 								    # call_tf is a multiple_results primitive.
 								    result_shapes = (result_shape,)
 								  else:
-												[jax2tf] Refactored the handling of float0.

JAX and TF have different ways of dealing with tangents and co-tangents for
exact types. JAX uses float0 values. TF sometimes uses None, sometines
integer (or boolean) zeros. In the JAX VJP function we convert the
None's to zeros. On exit from the VJP function we convert the float0
to zeros.

											
										
										
											2021-07-27 15:50:47 +03:00
+								    result_shapes = result_shape.tuple_shapes()  # type: ignore
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
-												Removed noop # type: ignore comments

mypy should now flag these by default.

											
										
										
											2024-05-17 09:46:36 +01:00
+								  result_avals = tuple(map(canonical_res_aval, result_shapes))
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								  submodule = mlir.xla_computation_to_mlir_module(xla_comp)
 								  symtab = ir.SymbolTable(submodule.operation)
 								  callee_result_types = symtab["main"].type.results
 								  fn = mlir.merge_mlir_modules(ctx.module_context.module,
 								                               f"call_tf_{function_flat_tf.name}",
-												Fix mlir.merge_mlir_modules to properly remember the inlined symbols

Previously, the `merge_mlir_modules` renamed the inlined symbols to
ensure they do not clash with the symbols in the destination module.
However, the inlined symbols were not inserted in the symbol table
so a conflict could arise later.

											
										
										
											2024-04-29 17:20:20 +03:00
+								                               submodule,
 								                               dst_symtab=ctx.module_context.symbol_table)
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								  call = func_dialect.CallOp(callee_result_types,
 								                             ir.FlatSymbolRefAttr.get(fn),
 								                             tuple(args_op) + captured_ops)
-												Remove code present to support jaxlib < 0.5.1.

The new minimum xla_extension_version is 317 and the new mlir_api_version is 58.

											
										
										
											2025-02-24 17:45:19 -05:00
+								  flat_results = call.results
-												[MHLO] Switch call_tf to use an MHLO lowering (attempt 2).

In passing refactor and fix some bugs in the MHLO helper code:
* mlir.ir_constant() failed to propagate its canonicalize_types argument to its callee.
* Refactor the code to convert an XLA computation to an MHLO module and to merge two MHLO modules from the XLA fallback translation rule path.
* Fix symbol (alpha) renaming of call operator callees when merging MHLO modules.

Attempt 2: In this iteration of the merge_mhlo_modules function, move all the operators into the target module first before doing any symbol table manipulation.

PiperOrigin-RevId: 442904129

											
										
										
											2022-04-19 13:59:28 -07:00
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								  if ordered:
 								    raise NotImplementedError(
 								        "ordered=True is not supported in the jitted context without"
 								        " `call_tf_graph=True`"
 								    )
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								  outputs = []
 								  for op, res_aval, res_shape in zip(flat_results, result_avals,
 								                                     result_shapes):
 								    if res_aval.dtype != res_shape.numpy_dtype():
 								      op = hlo.ConvertOp(mlir.aval_to_ir_type(res_aval), op).result
 								    outputs.append(op)
 								  return outputs
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[call_tf] Use the same platform for TF lowering as the embedding JAX computation

This requires some changes for abstract evaluation, when
JAX does not use a specific platform.

Also attempt to fix the case when the TF lowering fails because the TF computation
uses a tf.Variable on another device as that used for lowering.

PiperOrigin-RevId: 492112847

											
										
										
											2022-11-30 23:21:55 -08:00
+								def _register_call_lowering(platform):
 								  mlir.register_lowering(call_tf_p, functools.partial(_call_tf_lowering,
 								                                                      platform=platform),
 								                         platform=platform)
 								for platform in ("cpu", "cuda", "tpu"):
 								  _register_call_lowering(platform)
-												Add an experimental mechanism for calling TensorFlow functions from JAX.

The TF function is called in eager mode if called outside a JAX staging
context, or if compiled using TF (``tf.function(jit_compile=True)``) if
called outside a staging context. Reverse-mode AD is supported, by
calling TensorFlow's ``tf.tape_gradient``.

In a staging context, the implementation uses TF to compile the function
to XLA, and then adds a call from JAX's computation to the compiled
TF function. All metadata that TF puts in the generated XLA is carried
over.

See the `jax.experimental.jax2tf.README` file for details.

											
										
										
											2021-02-04 10:56:13 +02:00
-												[shape_poly, call_tf] Some improvements for call_tf in a shape polymorphic program

This is another attempt to land a rolled-back change https://github.com/google/jax/pull/14734 (cl/514070997).
See b/272154366 for more details.

The use case for call_tf with shape polymorphism is when we have a JAX program
that calls into TF function, and we want to serialize the JAX program with
some shapes unknown. Previously this use case did not work, except in the special
case when the output shape of the called TF function returns statically known
shapes.

The idea is that we allow the user of call_tf to specify the output shape.
This can be done even in presence of shape polymorphism, by writing the
output shape as an expression in terms of the input shapes. This is what
other JAX primitives do, e.g., concat, so we are simply enabling call_tf
to get the same behavior.

This change should be enough for old-style jax2tf, but will require more
work for native serialization.

We also removed some old code that was trying to workaround some limitations
in shape inference in TF. I think that those workarounds are ugly, and I am
prepared to give error messages rather than keep that code. So far no
tests fail.

PiperOrigin-RevId: 515137407

											
										
										
											2023-03-08 14:09:35 -08:00
+								# Support the call_tf under jax2tf.convert in eager mode
-												[jax2tf] Fix the round-trip call_tf(convert)

Also cleaned the handling of global state in jax2tf.

											
										
										
											2021-06-10 17:01:22 +02:00
+								def _jax2tf_call_tf(*args: TfVal,
-												[call_tf] Improved call_tf for op-by-op executions.

There are two major improvements here. First we ensure that
in op-by-op execution we can even execute functions that are not
compileable. We do this by ensuring that we do not trace the
TF function to a graph too early.

The other improvement is to work around some bugs in the TF shape
inference. Some TF graphs has unknown output shapes even when traced
with known inputs shapes. This happens even for some graph that
are generated by jax2tf, which we know should have known shapes. To
work around this, we get the output shapes for the TF function using
the XLA compiler, which is more reliably able to figure out the output
shapes. We do this even during abstract evaluation of the call_tf
primitive, and we use caching to ensure we do not call the TF
compiler repeatedly.

											
										
										
											2021-06-25 07:39:09 +02:00
+								                    callable_flat_tf: Callable,
 								                    **_) -> TfVal:
-												[jax2tf] enable multiple round-trips from JAX to TF

											
										
										
											2021-07-30 13:35:21 +03:00
+								  with jax2tf_internal.inside_call_tf():
 								    res_tf_flat = callable_flat_tf(*args)
-												[jax2tf] Fix the round-trip call_tf(convert)

Also cleaned the handling of global state in jax2tf.

											
										
										
											2021-06-10 17:01:22 +02:00
+								  return res_tf_flat
-												[jax2tf] Improved error checking for call_tf.

Cleaned up the abstract evaluation for call_tf to
work around a bug in TF whereby experimental_get_compiler_ir
cannot be used in a tf.function context.

Added more error messages, e.g., for the case when
the TF function has shape-influencing inputs.

											
										
										
											2021-07-10 18:49:25 +03:00
+								jax2tf_internal.tf_impl[call_tf_p] = _jax2tf_call_tf
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
 								def emit_tf_embedded_graph_custom_call(
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    ctx: mlir.LoweringRuleContext,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    concrete_function_flat_tf,
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								    operands: Sequence[ir.Value],
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    has_side_effects,
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								    ordered,
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								    output_avals,
 								):
-												[call_tf] Some cleanup of call_tf

The main cleanup is around _code_generator_and_avals, which in
an earlier version of the code was used for both abstract values
and for code generation. That is why it was cached, and why it
returned a code generator and abstract values. A while
ago we did a first round of cleaning to not use it for abstract
values. Now we can actually eliminate the function and inline
it directly.

A second improvement is to add the explicit error message from
TF commpilation, instead of just the generic message that
call_tf cannot be used with non-compileable functions.

											
										
										
											2023-04-27 13:42:23 +02:00
+								  """Emits a custom call referencing a tf.Graph embedding of the TF function.
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								  All call_tf called function information is stored in tf.metadata.
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  This includes:
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								  (1) The called function name: This name will be used by the runtime to execute
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  the callback.
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								  (2) The called function index in the XLACallModule `function_list` attribute.
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  """
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								  call_tf_concrete_function_list = jax2tf_internal.get_thread_local_state_call_tf_concrete_function_list()
 								  if call_tf_concrete_function_list is None:
 								    raise ValueError(
 								        "call_tf_graph=True only support exporting by jax2tf.convert currently."
 								    )
-												[call_tf] Fix call_tf lowering for multi-platform lowering

call_tf has per-platform lowering because the lowering
of the called TF function may depend on the platform. When
doing multi-platform lowering this means that we lower
call_tf several times and wrap the lowerings with a
conditional. This results in an assertion failure
in add_to_call_tf_concrete_function_list, because we
are attempting to add the same function multiple times.

Here we remove the assertion (afaik, it is Ok to add
multiple functions with the same name, because all
we care about is the index of the called function in
the list). We also reuse the existing function if
we are adding an identical one.

We add tests for call_tf with multi-platform lowering.

											
										
										
											2023-10-13 09:42:12 -07:00
+								  # TODO(necula): It is dangerous to modify global state when lowering because
 								  # there are a number of lowering caches that only cache the StableHLO.
 								  # See call_tf_test.py:test_multi_platform_call_tf_graph.
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								  called_index = add_to_call_tf_concrete_function_list(
 								      concrete_function_flat_tf, call_tf_concrete_function_list)
-												Bump XLACallModule to version 5 and add the function_list.

PiperOrigin-RevId: 529106145

											
										
										
											2023-05-03 09:04:01 -07:00
+								  tf_backend_config = {
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								      "has_token_input_output": ir.BoolAttr.get(ordered),
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								      "called_index": mlir.i64_attr(called_index),
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  }
-												ENH Use {} and () instead of dict() and tuple()

											
										
										
											2023-09-22 09:05:42 +01:00
+								  result_avals = ctx.avals_out if ctx.avals_out is not None else ()
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								  operands = list(operands)
 								  result_types = list(
-												Don't wrap singleton ir.Types during HLO lowering.

This is similar to https://github.com/google/jax/pull/22211, but for MLIR types instead of MLIR values.

											
										
										
											2024-07-03 16:38:18 -04:00
+								      mlir.flatten_ir_types([mlir.aval_to_ir_type(aval) for aval in result_avals])
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								  )
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								  if ordered:
-												Don't wrap singleton ir.Values with tuples during HLO lowering.

In general a JAX value might correspond to multiple HLO values, which is why the HLO lowering represents each value as a tuple of zero or more ir.Values. However, the common case is that there is exactly one value, and almost all such lists are singletons.

To reduce the number of singleton list and tuple objects allocated during MLIR lowering, instead represent singleton values as unwrapped ir.Values, and only use a tuple if there is not exactly one ir.Value backing a JAX value.

											
										
										
											2024-07-01 08:42:48 -04:00
+								    operands.insert(0, ctx.tokens_in.get(call_tf_ordered_effect))
-												Don't wrap singleton ir.Types during HLO lowering.

This is similar to https://github.com/google/jax/pull/22211, but for MLIR types instead of MLIR values.

											
										
										
											2024-07-03 16:38:18 -04:00
+								    result_types.insert(0, mlir.token_type())
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
 								  custom_call = hlo.CustomCallOp(
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								      result_types,
 								      operands,
-												[call_tf] Fix call_tf lowering for multi-platform lowering

call_tf has per-platform lowering because the lowering
of the called TF function may depend on the platform. When
doing multi-platform lowering this means that we lower
call_tf several times and wrap the lowerings with a
conditional. This results in an assertion failure
in add_to_call_tf_concrete_function_list, because we
are attempting to add the same function multiple times.

Here we remove the assertion (afaik, it is Ok to add
multiple functions with the same name, because all
we care about is the index of the called function in
the list). We also reuse the existing function if
we are adding an identical one.

We add tests for call_tf with multi-platform lowering.

											
										
										
											2023-10-13 09:42:12 -07:00
+								      call_target_name=ir.StringAttr.get("tf.call_tf_function"),
-												[1/n] store embedded tf.graph to stablehlo.custom_call

PiperOrigin-RevId: 519194911

											
										
										
											2023-03-24 11:26:44 -07:00
+								      has_side_effect=ir.BoolAttr.get(has_side_effects),
 								      api_version=mlir.i32_attr(2),
 								      called_computations=ir.ArrayAttr.get([]),
 								      backend_config=ir.StringAttr.get(""),
 								  )
 								  # Store TF metadata in unregistered attribute
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
+								  custom_call.attributes["tf.backend_config"] = ir.DictAttr.get(
 								      tf_backend_config
 								  )
 								  results = list(custom_call.results)
 								  if ordered:
 								    token = results.pop(0)
-												Don't wrap singleton ir.Values with tuples during HLO lowering.

In general a JAX value might correspond to multiple HLO values, which is why the HLO lowering represents each value as a tuple of zero or more ir.Values. However, the common case is that there is exactly one value, and almost all such lists are singletons.

To reduce the number of singleton list and tuple objects allocated during MLIR lowering, instead represent singleton values as unwrapped ir.Values, and only use a tuple if there is not exactly one ir.Value backing a JAX value.

											
										
										
											2024-07-01 08:42:48 -04:00
+								    ctx.set_tokens_out(mlir.TokenSet({call_tf_ordered_effect: token}))
-												Add (optional) ordered effects for `jax2tf.call_tf`

This allows users to express nested TensorFlow computation that must be ordered during execution. It leverages the existing JAX effects system to model such side effects and lower them to use XLA tokens.

With this change, `jax2tf.call_tf(ordered=True)` can be used to generate ordered TF calls. This has the following behavior:

* With `call_tf_graph=True`, this generates a custom call op with the following differences: (1) a `!stablehlo.token` argument/result is prepended to each custom call's argument/result list and (2) `tf.backend_config` has an additional `has_token_input_output = true` entry.
* Without `call_tf_graph=True`, this raises a `NotImplementedError()`.

For this, `jax_export.py` makes sure that dummy arguments/results added for ordered effects are not exposed to the public interface by passing constant values in a wrapper function. Because of this, adding ordered effects to jax2tf-ed computation no longer causes calling convention changes and can be safely allowed.

Example StableHLO produced from the added test:

```
module @jit_f_jax attributes {mhlo.num_partitions = 1 : i32, mhlo.num_replicas = 1 : i32} {
  func.func public @main(%arg0: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.constant dense<> : tensor<0xi1>
    %1:2 = call @_wrapped_jax_export_main(%0, %arg0) : (tensor<0xi1>, tensor<f32>) -> (tensor<0xi1>, tensor<f32>)
    return %1#1 : tensor<f32>
  }
  func.func private @_wrapped_jax_export_main(%arg0: tensor<0xi1> {jax.token = true}, %arg1: tensor<f32> {jax.arg_info = "x", mhlo.sharding = "{replicated}"}) -> (tensor<0xi1> {jax.token = true}, tensor<f32> {jax.result_info = ""}) {
    %0 = stablehlo.create_token : !stablehlo.token
    %1 = stablehlo.constant dense<0> : tensor<i32>
    %2:3 = stablehlo.while(%iterArg = %0, %iterArg_0 = %1, %iterArg_1 = %arg1) : !stablehlo.token, tensor<i32>, tensor<f32>
     cond {
      %4 = stablehlo.constant dense<4> : tensor<i32>
      %5 = stablehlo.compare  LT, %iterArg_0, %4,  SIGNED : (tensor<i32>, tensor<i32>) -> tensor<i1>
      stablehlo.return %5 : tensor<i1>
    } do {
      %4 = stablehlo.custom_call @tf.call_tf_function(%iterArg, %iterArg_1) {api_version = 2 : i32, has_side_effect = true, tf.backend_config = {caller_name = "__inference_callable_flat_tf_10", has_token_input_output = true}} : (!stablehlo.token, tensor<f32>) -> !stablehlo.token
      %5 = stablehlo.constant dense<1.000000e+00> : tensor<f32>
      %6 = stablehlo.add %iterArg_1, %5 : tensor<f32>
      %7 = stablehlo.constant dense<1> : tensor<i32>
      %8 = stablehlo.add %iterArg_0, %7 : tensor<i32>
      stablehlo.return %4, %8, %6 : !stablehlo.token, tensor<i32>, tensor<f32>
    }
    %3 = stablehlo.constant dense<> : tensor<0xi1>
    return %3, %2#2 : tensor<0xi1>, tensor<f32>
  }
}
```

PiperOrigin-RevId: 534926215

											
										
										
											2023-05-24 11:47:58 -07:00
 								  return results
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
-												Use lower-case PEP 585 names for types.

Issue https://github.com/google/jax/issues/16537

PiperOrigin-RevId: 542969282

											
										
										
											2023-06-23 15:11:37 -07:00
+								def add_to_call_tf_concrete_function_list(concrete_tf_fn: Any, call_tf_concrete_function_list: list[Any]) -> int:
-												[call_tf] Fix call_tf lowering for multi-platform lowering

call_tf has per-platform lowering because the lowering
of the called TF function may depend on the platform. When
doing multi-platform lowering this means that we lower
call_tf several times and wrap the lowerings with a
conditional. This results in an assertion failure
in add_to_call_tf_concrete_function_list, because we
are attempting to add the same function multiple times.

Here we remove the assertion (afaik, it is Ok to add
multiple functions with the same name, because all
we care about is the index of the called function in
the list). We also reuse the existing function if
we are adding an identical one.

We add tests for call_tf with multi-platform lowering.

											
										
										
											2023-10-13 09:42:12 -07:00
+								  try:
 								    called_index = call_tf_concrete_function_list.index(concrete_tf_fn)
 								  except ValueError:
 								    called_index = len(call_tf_concrete_function_list)
 								    call_tf_concrete_function_list.append(concrete_tf_fn)
-												Add new `called_index` to custom_call  `tf.backend_config` DictAttr.
Here, `called_index` indicates the tf concrete function index in the `function_list` of the parent XLACallModule.

PiperOrigin-RevId: 535417558

											
										
										
											2023-05-25 15:58:16 -07:00
+								  return called_index