rocm_jax/jax/interpreters/batching.py

# Copyright 2018 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
from collections import namedtuple
import itertools as it
import numpy as onp
from six.moves import reduce
from .. import core
from ..core import Trace, Tracer, new_master, pack, AbstractTuple, JaxTuple
from ..abstract_arrays import ShapedArray, make_shaped_array, array_types
from ..ad_util import add_jaxvals_p, zeros_like_p, zeros_like_jaxval
from ..linear_util import transformation, transformation_with_aux, wrap_init
from ..tree_util import register_pytree_node
from ..util import unzip2, partial, safe_map
map = safe_map
def batch(fun, in_vals, in_dims, out_dim_target):
  sizes = reduce(set.union, map(dimsize, in_dims, in_vals))
  if not sizes:
    return fun.call_wrapped(*in_vals), None  # no mapped dimensions
  elif len(sizes) == 1:
    out_val, out_dim = batch_transform(fun).call_wrapped(in_vals, in_dims)
    return moveaxis(sizes.pop(), out_dim_target, out_dim, out_val)
  else:
    raise TypeError("got inconsistent map dimension sizes: {}".format(sizes))
# TODO(mattjj,dougalm): could call batch_subtrace here (a bit redundant)
@transformation
def batch_transform(vals, dims):
  with new_master(BatchTrace) as master:
    trace = BatchTrace(master, core.cur_sublevel())
    in_tracers = map(partial(BatchTracer, trace), vals, dims)
    out_tracer = yield in_tracers
    out_tracer = trace.full_raise(out_tracer)
    out_val, out_dim = out_tracer.val, out_tracer.batch_dim
    del master
  yield (out_val, out_dim)
@transformation_with_aux
def batch_subtrace(master, dims, *vals):
  trace = BatchTrace(master, core.cur_sublevel())
  ans = yield map(partial(BatchTracer, trace), vals, dims)
  out_tracer = trace.full_raise(ans)
  out_val, out_dim = out_tracer.val, out_tracer.batch_dim
  yield out_val, out_dim
### tracer

class BatchTracer(Tracer):
  def __init__(self, trace, val, batch_dim):
    self.trace = trace
    self.val = val
    self.batch_dim = batch_dim

  @property
  def aval(self):
    batched_aval = get_aval(self.val)
    return remove_batch_dim_from_aval(self.batch_dim, batched_aval)

  def unpack(self):
    t = type(self.batch_dim)
    if t is tuple:
      batch_dims = self.batch_dim
    elif t is int:
      batch_dims = [self.batch_dim] * len(self.val)
    elif t is type(None):
      return tuple(self.val)
    else:
      raise TypeError(t)

    return map(partial(BatchTracer, self.trace), self.val, batch_dims)

  def full_lower(self):
    if self.batch_dim is None:
      return core.full_lower(self.val)
    else:
      return self
class BatchTrace(Trace):
  def pure(self, val):
    return BatchTracer(self, val, None)

  def lift(self, val):
    return BatchTracer(self, val, None)

  def sublift(self, val):
    return BatchTracer(self, val.val, val.batch_dim)

  def process_primitive(self, primitive, tracers, params):
    vals_in, dims_in = unzip2((t.val, t.batch_dim) for t in tracers)
    if all(bdim is None for bdim in dims_in):
      return primitive.bind(*vals_in, **params)
    else:
      batched_primitive = get_primitive_batcher(primitive)
      val_out, dim_out = batched_primitive(vals_in, dims_in, **params)
      return BatchTracer(self, val_out, dim_out)

  def process_call(self, call_primitive, f, tracers, params):
    vals, dims = unzip2((t.val, t.batch_dim) for t in tracers)
    if all(bdim is None for bdim in dims):
      return call_primitive.bind(f, *vals, **params)
    else:
      f, dim_out = batch_subtrace(f, self.master, dims)
      val_out = call_primitive.bind(f, *vals, **params)
      return BatchTracer(self, val_out, dim_out())

  def post_process_call(self, _, out_tracer):
    raise NotImplementedError  # TODO(mattjj,dougalm)

  def pack(self, tracers):
    vals = pack([t.val for t in tracers])
    batch_dim = tuple(t.batch_dim for t in tracers)
    return BatchTracer(self, vals, batch_dim)
### abstract values
def get_aval(x):
  if isinstance(x, Tracer):
    return raise_to_shaped(x.aval)
  else:
    return shaped_aval(x)

def shaped_aval(x):
  try:
    return pytype_aval_mappings[type(x)](x)
  except KeyError:
    raise TypeError("{} is not a valid type for batching".format(type(x)))

def raise_to_shaped(aval):
  if type(aval) is AbstractTuple:
    return AbstractTuple(map(raise_to_shaped, aval))
  elif isinstance(aval, ShapedArray):
    return ShapedArray(aval.shape, aval.dtype)
  else:
    raise TypeError(type(aval))
def remove_batch_dim_from_aval(bdim, aval):
  t = type(aval)
  if t is AbstractTuple:
    if type(bdim) is tuple:
      return AbstractTuple(map(remove_batch_dim_from_aval, bdim, aval))
    else:
      return AbstractTuple(map(partial(remove_batch_dim_from_aval, bdim), aval))
  elif t is ShapedArray:
    if bdim is None:
      return ShapedArray(aval.shape, aval.dtype)
    else:
      assert 0 <= bdim < aval.ndim
      unbatched_shape = tuple(onp.delete(aval.shape, bdim))
      return ShapedArray(unbatched_shape, aval.dtype)
  else:
    raise TypeError(t)
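# A quick worked example (comment-only sketch) of the ShapedArray case:
#   remove_batch_dim_from_aval(1, ShapedArray((5, 3, 4), onp.float32))
#     == ShapedArray((5, 4), onp.float32)
# and with bdim=None the aval's shape is left unchanged.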
pytype_aval_mappings = {}

def shaped_jaxtuple(xs):
  return AbstractTuple(map(shaped_aval, xs))

pytype_aval_mappings[JaxTuple] = shaped_jaxtuple

for t in array_types:
  pytype_aval_mappings[t] = make_shaped_array
### primitives
primitive_batchers = {}
def get_primitive_batcher(p):
  try:
    return primitive_batchers[p]
  except KeyError:
    raise NotImplementedError(
        "Batching rule for '{}' not implemented".format(p))

def defvectorized(prim):
  primitive_batchers[prim] = partial(vectorized_batcher, prim)

def vectorized_batcher(prim, batched_args, batch_dims, **params):
  assert all(batch_dims[0] == bd for bd in batch_dims[1:])
  return prim.bind(*batched_args, **params), batch_dims[0]
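# Hypothetical registration sketch (not a rule defined in this module): an
# elementwise primitive can reuse vectorized_batcher as-is, since binding it
# on batched operands that share a batch dimension yields an output batched
# along that same dimension.
#
#   sin_p = core.Primitive('sin')  # hypothetical primitive object
#   defvectorized(sin_p)           # rule: bind unchanged, keep the batch dim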
def defbroadcasting(prim):
  primitive_batchers[prim] = partial(broadcast_batcher, prim)

def broadcast_batcher(prim, batched_args, batch_dims, **params):
  args = map(bdim_at_front, batched_args, batch_dims)
  ndim = max(map(onp.ndim, args))  # special case to handle scalar broadcasting
  args = map(partial(handle_scalar_broadcasting, ndim), args, batch_dims)
  return prim.bind(*args, **params), 0
def defreducer(prim):
  primitive_batchers[prim] = partial(reducer_batcher, prim)

def reducer_batcher(prim, batched_args, batch_dims, axes, **kwargs):
  operand, = batched_args
  bdim, = batch_dims
  axes = tuple(onp.where(onp.less(axes, bdim), axes, onp.add(axes, 1)))
  bdim_out = list(onp.delete(onp.arange(operand.ndim), axes)).index(bdim)
  if 'input_shape' in kwargs:
    kwargs['input_shape'] = operand.shape
  return prim.bind(operand, axes=axes, **kwargs), bdim_out
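# Worked example (illustration only): reducing over axes=(1,) of an operand
# whose batched shape is (5, 3, 4) with bdim=0. Since 1 >= bdim, the axis
# shifts right to axes=(2,); the surviving dimensions of the batched operand
# are (0, 1), and the batch dimension 0 sits at position 0 of that list, so
# bdim_out = 0.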
# set up primitive batchers for ad_util primitives
def add_batched(batched_args, batch_dims):
  bdx, bdy = batch_dims
  if bdx == bdy:
    xs, ys = batched_args
    return add_jaxvals_p.bind(xs, ys), bdx
  else:
    xs, ys = map(bdim_at_front, batched_args, batch_dims)
    return add_jaxvals_p.bind(xs, ys), 0
primitive_batchers[add_jaxvals_p] = add_batched
def zeros_like_batched(batched_args, batch_dims):
  val, = batched_args
  bdim, = batch_dims
  return zeros_like_jaxval(val), bdim
primitive_batchers[zeros_like_p] = zeros_like_batched
### util

# These utilities depend on primitives for things like broadcasting, reshaping,
# and transposition on arrays. To avoid a circular import from depending on
# lax.py, these functions use method dispatch on their arguments, which could be
# DeviceArrays, numpy.ndarrays, or traced versions of those. This strategy
# almost works, except for broadcast, for which raw numpy.ndarrays don't have a
# method. To handle that case, the `broadcast` function checks for raw ndarrays
# and scalars explicitly and falls back to onp.broadcast_to.
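#
# For instance (comment-only sketch), both of the following go through the
# same .transpose method call, so one code path serves concrete and traced
# values alike:
#   move_dim_to_front(onp.ones((3, 5)), 1)     # onp.ndarray.transpose
#   move_dim_to_front(some_batched_value, 1)   # method on a JAX array-like
# where `some_batched_value` stands in for any array-like JAX value.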
def bdim_at_front(x, bdim, broadcast_size=1):
  if bdim is None:
    return broadcast(x, broadcast_size)
  else:
    return move_dim_to_front(x, bdim)
def move_dim_to_front(x, dim):
  aval = get_aval(x)
  if type(aval) is AbstractTuple:
    return pack(map(partial(move_dim_to_front, dim=dim), x))
  elif isinstance(aval, ShapedArray):
    assert 0 <= dim < onp.ndim(x)
    if dim == 0:
      return x
    else:
      perm = (dim,) + tuple(range(dim)) + tuple(range(dim + 1, onp.ndim(x)))
      return x.transpose(perm)
  else:
    raise TypeError(type(x))
def dimsize(dim, x):
  aval = get_aval(x)
  if type(aval) is AbstractTuple:
    return reduce(set.union, map(partial(dimsize, dim), x))
  elif type(dim) is int:
    return {x.shape[dim]}
  elif dim is None:
    return set()
  else:
    raise TypeError(type(dim))
def moveaxis(sz, dst, src, x):
  aval = get_aval(x)
  if type(aval) is AbstractTuple:
    if type(src) is tuple and type(dst) is tuple:
      return pack(map(partial(moveaxis, sz), dst, src, x))
    elif type(src) is tuple:
      return pack(map(partial(moveaxis, sz, dst), src, x))
    elif type(dst) is tuple:
      srcs = (src,) * len(dst)
      return pack(map(partial(moveaxis, sz), dst, srcs, x))
    else:
      return pack(map(partial(moveaxis, sz, dst, src), x))
  elif isinstance(aval, ShapedArray):
    dst = (dst % aval.ndim) if dst is not None and aval.ndim else dst
    if src == dst:
      return x
    else:
      if src is None:
        x = broadcast(x, sz, force_broadcast=True)
        src = 0
      if src == dst:
        return x
      else:
        perm = [i for i in range(onp.ndim(x)) if i != src]
        perm.insert(dst, src)
        return x.transpose(perm)
  else:
    raise TypeError(type(aval))
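# Worked example (illustration only): moveaxis(5, 0, 2, x) on an x of shape
# (3, 4, 5) produces shape (5, 3, 4), moving the batch dimension from axis 2
# to axis 0; with src=None the value is first broadcast to a leading axis of
# size sz and then handled as if already batched at axis 0.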
def broadcast(x, sz, force_broadcast=False):
  aval = get_aval(x)
  if type(aval) is AbstractTuple:
    return pack(map(partial(broadcast, sz=sz), x))
  elif isinstance(aval, ShapedArray):
    # for scalars, maybe don't actually broadcast
    if not onp.ndim(x) and not force_broadcast:
      return x
    # see comment at the top of this section
    if isinstance(x, onp.ndarray) or onp.isscalar(x):
      return onp.broadcast_to(x, (sz,) + onp.shape(x))
    else:
      return x.broadcast((sz,))  # should be a JAX arraylike
  else:
    raise TypeError(type(x))
def handle_scalar_broadcasting(nd, x, bdim):
  assert isinstance(get_aval(x), ShapedArray)
  if bdim is None or nd == onp.ndim(x):
    return x
  else:
    return x.reshape(x.shape + (1,) * (nd - x.ndim))
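# Worked example (illustration only): with nd=3, a batched value of shape
# (5, 2) and bdim=0 is reshaped to (5, 2, 1) so it lines up with rank-3
# operands in broadcast_batcher; values with bdim=None or already of rank nd
# pass through unchanged.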