rocm_jax/jax/experimental/array.py

# Copyright 2021 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from __future__ import annotations

import operator as op
import numpy as np
from typing import Sequence, Tuple, Callable, Union, Optional, cast, List

from jax import core
from jax._src import abstract_arrays
from jax._src import ad_util
from jax._src import api_util
from jax._src import dispatch
from jax._src import dtypes
from jax._src.lax import lax as lax_internal
from jax._src.config import config
from jax._src.util import prod, safe_zip
from jax._src.lib import xla_client as xc
from jax._src.api import device_put
from jax._src.numpy.ndarray import ndarray
from jax.interpreters import pxla, xla, mlir
from jax.experimental.sharding import (Sharding, SingleDeviceSharding,
                                       XLACompatibleSharding)

Shape = Tuple[int, ...]
Device = xc.Device
DeviceArray = xc.Buffer
Index = Tuple[slice, ...]
ArrayLike = Union[np.ndarray, DeviceArray]


class Shard:
  """One per-device piece of an ``Array`` together with its placement.

  ``index`` and ``replica_id`` are not stored; they are derived on every access
  from the sharding and the global shape handed to the constructor.

  Attributes:
    device : The device this shard lives on.
    index : Where this shard sits inside the global array.
    replica_id : Which replica of the global array this shard belongs to.
      Always 0 for fully sharded data (i.e. when there is only 1 replica).
    data : The contents of this shard. None if ``device`` is non-local.
  """

  def __init__(self, device: Device, sharding: Sharding, global_shape: Shape,
               data: Optional[Array] = None):
    self.data = data
    self.device = device
    self._global_shape = global_shape
    self._sharding = sharding

  def __repr__(self):
    # Shardings that cannot produce an index / replica id raise ValueError from
    # the properties below; fall back to the short form in that case.
    try:
      index, replica_id = self.index, self.replica_id
    except ValueError:
      return f'Shard(device={self.device!r}, data={self.data})'
    return (f'Shard(device={self.device!r}, index={index}, '
            f'replica_id={replica_id}, data={self.data})')

  @property
  def index(self) -> Index:
    """Index of this shard in the global array, as reported by the sharding.

    Raises:
      ValueError: if the sharding has no ``device_indices`` attribute.
    """
    sharding = self._sharding
    try:
      indices_for_device = sharding.device_indices
    except AttributeError:
      raise ValueError('Cannot calculate indices from sharding: '
                       f'{sharding}. Please create a device to index '
                       'mapping for your sharding.') from None
    result = indices_for_device(self.device, self._global_shape)
    assert result is not None
    return result

  @property
  def replica_id(self) -> int:
    """Replica id of this shard's device, as reported by the sharding.

    Raises:
      ValueError: if the sharding has no ``device_replica_id_map`` attribute.
    """
    sharding = self._sharding
    try:
      replica_ids_for_shape = sharding.device_replica_id_map  # pytype: disable=attribute-error
    except AttributeError:
      raise ValueError('Cannot calculate replica ids from sharding: '
                       f'{sharding}. Please create a device to replica id '
                       'mapping for your sharding.') from None
    replica_ids = replica_ids_for_shape(self._global_shape)
    return replica_ids[self.device]


def _reconstruct_array(fun, args, arr_state, aval_state):
  """Rebuild an array from the pieces emitted by ``Array.__reduce__``.

  Args:
    fun: Callable that, applied to ``args``, creates the host array object.
    args: Positional arguments for ``fun``.
    arr_state: State passed to the host array's ``__setstate__``.
    aval_state: Keyword arguments applied to the resulting ``aval`` through
      ``aval.update``.

  Returns:
    The result of ``device_put`` on the restored host array, with its ``aval``
    replaced by the updated one.
  """
  host_array = fun(*args)
  host_array.__setstate__(arr_state)
  restored = device_put(host_array)
  restored.aval = restored.aval.update(**aval_state)
  return restored


class Array:
  """An array assembled from per-device buffers laid out by a ``Sharding``.

  An ``Array`` pairs an abstract value (``aval``: global shape, dtype and
  weak-type flag) with a sharding and the list of per-device buffers
  (``_arrays``). The host copy of the data is built lazily by ``_value`` and
  cached in ``_npy_value``; most NumPy-like dunder methods go through it.

  Args:
    aval: Abstract value describing the global array.
    sharding: How the global array is laid out across devices.
    arrays: The per-device buffers. Elements that are not ``DeviceArray``
      instances are treated as ``Array``s and replaced by their first buffer.
    committed: Stored as ``_committed``; see the JAX FAQ entry linked in
      ``__init__`` for what committed means.
    _skip_checks: When true, the buffers are assumed to already be ordered to
      match the sharding's device assignment, so no reordering is done, and the
      dtype check only runs if ``config.jax_enable_checks`` is set.

  Raises:
    ValueError: when checks are enabled, the sharding is an
      ``XLACompatibleSharding`` and the buffers do not match its addressable
      device assignment (wrong count, or placed on other devices).
  """
  # TODO(yashkatariya): Add __slots__ here.

  def __init__(self, aval: core.ShapedArray, sharding: Sharding,
               arrays: Union[Sequence[DeviceArray], Sequence[Array]],
               committed: bool, _skip_checks: bool = False):
    self.aval = aval
    self._sharding = sharding
    # Extract DeviceArrays from arrays with `SingleDeviceSharding` to keep the
    # code handling `self._arrays` simpler.
    # TODO(yashkatariya): This will be slower as it will happen during
    # `__init__` on single controller environment. Make it lazy.
    self._arrays: List[DeviceArray] = [a if isinstance(a, DeviceArray) else a._arrays[0]
                                       for a in arrays]
    # See https://jax.readthedocs.io/en/latest/faq.html#controlling-data-and-computation-placement-on-devices
    # for what committed means.
    self._committed = committed
    # Host-side cache filled in by `_value`; cleared by `delete`.
    self._npy_value = None

    # TODO(yashkatariya): Add a check here which checks if the expected shard
    # shape matches the shape of _arrays. A similar check exists for GDA.

    if not _skip_checks or config.jax_enable_checks:
      assert all(db.dtype == self.dtype for db in self._arrays), (
          "Input arrays to `Array` must have matching dtypes, "
          f"got: {[db.dtype for db in self._arrays]}, aval type: {self.dtype}")

    # Don't rearrange if skip_checks is enabled because this assumes that the
    # input buffers are already arranged properly. This usually happens when
    # Arrays are created as output of a JAX transformation
    # (like pjit, xmap, etc).
    if not _skip_checks:
      addressable_device_assignment = self.sharding._addressable_device_assignment
      # Rearrange arrays based on the device assignment.
      if isinstance(sharding, XLACompatibleSharding):
        if len(self._arrays) != len(addressable_device_assignment):
          raise ValueError(
              f"Expected {len(addressable_device_assignment)} per-device arrays "
              "(this is how many devices are addressable by the sharding), but "
              f"got {len(self._arrays)}")
        device_to_buffer = {db.device().id: db for db in self._arrays}
        try:
          self._arrays = [device_to_buffer[device.id]
                          for device in addressable_device_assignment]
        except KeyError as e:
          # Report which buffers sit on devices the sharding does not use.
          array_device_ids = {a.device().id for a in self._arrays}
          addressable_device_ids = {d.id for d in addressable_device_assignment}
          diff = array_device_ids - addressable_device_ids
          raise ValueError(
              f"Some per-device arrays are placed on devices {diff}, which are "
              f"not used in the specified sharding {self.sharding}") from e

  @property
  def shape(self) -> Shape:
    """Global shape, taken from ``aval``."""
    return self.aval.shape

  @property
  def dtype(self):
    """Element dtype, taken from ``aval``."""
    return self.aval.dtype

  @property
  def ndim(self):
    """Number of dimensions of the global shape."""
    return len(self.shape)

  @property
  def size(self):
    """Total number of elements (product of the global shape)."""
    return prod(self.shape)

  @property
  def sharding(self):
    """The sharding passed to the constructor."""
    return self._sharding

  def __str__(self):
    return str(self._value)

  def __len__(self):
    try:
      return self.shape[0]
    except IndexError as err:
      raise TypeError("len() of unsized object") from err  # same as numpy error

  def __bool__(self):
    return bool(self._value)

  def __nonzero__(self):
    # Python 2 spelling of `__bool__`.
    return bool(self._value)

  def __float__(self):
    return self._value.__float__()

  def __int__(self):
    return self._value.__int__()

  def __complex__(self):
    return self._value.__complex__()

  def __hex__(self):
    assert self.ndim == 0, 'hex only works on scalar values'
    return hex(self._value)  # type: ignore

  def __oct__(self):
    assert self.ndim == 0, 'oct only works on scalar values'
    return oct(self._value)  # type: ignore

  def __index__(self):
    return op.index(self._value)

  def tobytes(self, order="C"):
    """Returns the bytes of the host value, as ``numpy.ndarray.tobytes``."""
    return self._value.tobytes(order)

  def tolist(self):
    """Returns the host value as nested Python lists."""
    return self._value.tolist()

  def __format__(self, format_spec):
    # Simulates behavior of https://github.com/numpy/numpy/pull/9883
    if self.ndim == 0:
      return format(self._value[()], format_spec)
    else:
      return format(self._value, format_spec)

  def __iter__(self):
    if self.ndim == 0:
      raise TypeError("iteration over a 0-d array")  # same as numpy error
    else:
      # chunk_iter is added to Array in lax_numpy.py similar to DA.
      return (sl for chunk in self._chunk_iter(100) for sl in chunk._unstack())  # type: ignore

  def item(self):
    """Converts the array to a Python scalar chosen by its dtype.

    Raises:
      TypeError: if the dtype is not complex, floating, integer or boolean.
    """
    if dtypes.issubdtype(self.dtype, np.complexfloating):
      return complex(self)
    elif dtypes.issubdtype(self.dtype, np.floating):
      return float(self)
    elif dtypes.issubdtype(self.dtype, np.integer):
      return int(self)
    elif dtypes.issubdtype(self.dtype, np.bool_):
      return bool(self)
    else:
      raise TypeError(self.dtype)

  def is_fully_replicated(self) -> bool:
    """Returns True if the first buffer has the full global shape.

    Raises:
      RuntimeError: if the array has been deleted.
    """
    # Without this check a deleted array fails with an opaque
    # "'NoneType' object is not subscriptable" TypeError.
    self._check_if_deleted()
    return self.shape == self._arrays[0].shape

  def __repr__(self):
    prefix = '{}('.format(self.__class__.__name__.lstrip('_'))
    if self.aval is not None and self.aval.weak_type:
      dtype_str = f'dtype={self.dtype.name}, weak_type=True)'
    else:
      dtype_str = f'dtype={self.dtype.name})'

    # The values can only be printed when `_value` is able to produce them;
    # otherwise fall back to printing the shape.
    if self.is_fully_addressable() or self.is_fully_replicated():
      line_width = np.get_printoptions()["linewidth"]
      s = np.array2string(self._value, prefix=prefix, suffix=',',
                          separator=', ', max_line_width=line_width)
      last_line_len = len(s) - s.rfind('\n') + 1
      sep = ' '
      if last_line_len + len(dtype_str) + 1 > line_width:
        sep = ' ' * len(prefix)
      return f"{prefix}{s},{sep}{dtype_str}"
    else:
      return f"{prefix}{self.shape}, {dtype_str}"

  def is_fully_addressable(self) -> bool:
    """Delegates to ``sharding.is_fully_addressable()``."""
    return self.sharding.is_fully_addressable()

  def __array__(self, dtype=None, context=None):
    return np.asarray(self._value, dtype=dtype)

  def __dlpack__(self):
    from jax.dlpack import to_dlpack  # pylint: disable=g-import-not-at-top
    return to_dlpack(self)

  def __reduce__(self):
    # Pickle through the host value, carrying along the aval fields that a
    # plain `device_put` of that value would not restore.
    fun, args, arr_state = self._value.__reduce__()
    aval_state = {'weak_type': self.aval.weak_type,
                  'named_shape': self.aval.named_shape}
    return (_reconstruct_array, (fun, args, arr_state, aval_state))

  # TODO(yashkatariya): Remove this method when everyone is using devices().
  def device(self) -> Device:
    """Returns the single device of the sharding.

    Raises:
      RuntimeError: if the array has been deleted.
      ValueError: if the sharding's device set does not hold exactly one device.
    """
    self._check_if_deleted()
    device_set = self.sharding.device_set
    if len(device_set) == 1:
      single_device, = device_set
      return single_device
    raise ValueError('Length of devices is greater than 1. '
                     'Please use `.devices()`.')

  def devices(self) -> List[Device]:
    """Returns the devices of the sharding as a list.

    Raises:
      RuntimeError: if the array has been deleted.
    """
    self._check_if_deleted()
    return list(self.sharding.device_set)

  @pxla.maybe_cached_property
  def addressable_shards(self) -> Sequence[Shard]:
    """One ``Shard`` per buffer in ``_arrays``, in the same order.

    Raises:
      RuntimeError: if the array has been deleted.
    """
    self._check_if_deleted()
    out = []
    for db in self._arrays:
      db = pxla._set_aval(db)
      device = db.device()
      # Wrap the device arrays in `Array` until C++ returns an Array instead
      # of a DA.
      array = Array(db.aval, SingleDeviceSharding(device), [db], committed=True,
                    _skip_checks=True)
      out.append(Shard(device, self.sharding, self.shape, array))
    return out

  def delete(self):
    """Deletes every buffer and drops the cached host value. Idempotent."""
    if self._arrays is None:
      return
    for buf in self._arrays:
      buf.delete()
    self._arrays = None
    self._npy_value = None

  def is_deleted(self):
    """Returns True if ``delete()`` was called or every buffer is deleted."""
    # `delete()` replaces `_arrays` with None; iterating it would raise
    # TypeError instead of answering the question.
    if self._arrays is None:
      return True
    return all(buf.is_deleted() for buf in self._arrays)

  def _check_if_deleted(self):
    if self._arrays is None:
      raise RuntimeError("Array has been deleted.")

  def block_until_ready(self):
    """Blocks on every buffer and returns ``self``.

    Raises:
      RuntimeError: if the array has been deleted.
    """
    self._check_if_deleted()
    for db in self._arrays:
      db.block_until_ready()
    return self

  def _first_replica_shards(self) -> List[Shard]:
    """Returns the addressable shards that must be read to build the host value.

    If the sharding can report replica ids, only shards with replica id 0 are
    returned so replicated data is read once; if it cannot (``replica_id``
    raises ValueError), every addressable shard is returned.
    """
    shards = self.addressable_shards
    try:
      shards[0].replica_id
      replica_id_exists = True
    except ValueError:
      replica_id_exists = False
    return [s for s in shards if not replica_id_exists or s.replica_id == 0]

  def copy_to_host_async(self):
    """Starts device-to-host copies for the shards ``_value`` will read.

    Does nothing if the host value is already cached.

    Raises:
      RuntimeError: if the array has been deleted.
    """
    self._check_if_deleted()
    if self._npy_value is None:
      for s in self._first_replica_shards():
        s.data._arrays[0].copy_to_host_async()  # pytype: disable=attribute-error

  @property
  def _value(self) -> np.ndarray:
    """The global array as a NumPy array, computed once and cached.

    Raises:
      RuntimeError: if the array has been deleted, or if it is neither fully
        replicated nor fully addressable.
    """
    self._check_if_deleted()

    if self._npy_value is None:
      # A fully replicated array can be read from any single buffer.
      if self.is_fully_replicated():
        self._npy_value = np.asarray(self._arrays[0])  # type: ignore
        return cast(np.ndarray, self._npy_value)

      if not self.is_fully_addressable():
        raise RuntimeError("Fetching value for `jax.Array` that spans "
                           "non-addressable devices is not possible. You can use "
                           "`jax.experimental.multihost_utils.process_allgather` "
                           "for this use case.")

      # Kick off all transfers first, then assemble shard by shard.
      self.copy_to_host_async()
      npy_value = np.empty(self.shape, self.dtype)
      for s in self._first_replica_shards():
        npy_value[s.index] = np.asarray(s.data._arrays[0])  # type: ignore  # [union-attr]
      self._npy_value = npy_value  # type: ignore
    # https://docs.python.org/3/library/typing.html#typing.cast
    return cast(np.ndarray, self._npy_value)

# Arrays are deliberately unhashable. Same as what device_array.py does.
Array.__hash__ = None  # type: ignore

def make_array_from_callback(shape: Shape, sharding: Sharding,
                             data_callback: Callable[[Optional[Index]], ArrayLike]) -> Array:
  """Builds an ``Array`` by asking a callback for each device's piece.

  Args:
    shape: Global shape of the array to create.
    sharding: Sharding of the result; supplies the addressable devices and the
      index of the global array that belongs to each of them.
    data_callback: Called once per addressable device with that device's
      index; its result is placed on the device with ``device_put``.

  Returns:
    A committed ``Array`` with the given shape and sharding, whose dtype is
    the dtype of the first per-device piece and whose ``weak_type`` is False.
  """
  per_device_arrays = []
  for device in sharding.addressable_devices:
    device_index = sharding.device_indices(device, shape)
    per_device_arrays.append(device_put(data_callback(device_index), device))
  global_aval = core.ShapedArray(shape, per_device_arrays[0].dtype,
                                 weak_type=False)
  return Array(global_aval, sharding, per_device_arrays, committed=True)


# Import-time registration of `Array` with the type-keyed registries of the
# modules imported above.
# Abstract-value lookups: `core` goes through `canonical_concrete_aval`, while
# `xla` and `api_util` simply read the `aval` attribute stored on the instance.
core.pytype_aval_mappings[Array] = abstract_arrays.canonical_concrete_aval
xla.pytype_aval_mappings[Array] = op.attrgetter('aval')
# NOTE(review): `pxla.identity` presumably returns its argument unchanged, i.e.
# no dtype canonicalization is applied to an Array -- confirm.
xla.canonicalize_dtype_handlers[Array] = pxla.identity
api_util._shaped_abstractify_handlers[Array] = op.attrgetter('aval')
# Addition and zeros-like implementations that `ad_util` looks up by type.
ad_util.jaxval_adders[Array] = lax_internal.add
ad_util.jaxval_zeros_likers[Array] = lax_internal.zeros_like_array
# NOTE(review): presumably makes `isinstance(x, ndarray)` true for an Array
# (ABC-style `register`) -- confirm against jax._src.numpy.ndarray.
ndarray.register(Array)


def _array_mlir_constant_handler(val, canonicalize_types=True):
  """Lowers an ``Array`` constant by delegating to ``mlir.ir_constants``.

  The array is first materialized on the host through ``val._value``.
  """
  host_value = val._value
  return mlir.ir_constants(host_value, canonicalize_types=canonicalize_types)
mlir.register_constant_handler(Array, _array_mlir_constant_handler)


def _device_put_array(x, device: Optional[Device]):
  """``device_put`` handler for ``Array``.

  Args:
    x: The ``Array`` to place; must be fully addressable.
    device: Target device, forwarded unchanged to the ``dispatch`` helpers.

  Returns:
    A 1-tuple holding the copied buffer when ``x`` has a
    ``SingleDeviceSharding``; otherwise whatever
    ``dispatch._device_put_array`` returns for the host value of ``x``.
  """
  # TODO(yashkatariya): Remove this restriction and the round trip via host
  # once lowering to XLA goes through `lower_mesh_computation`.
  assert x.is_fully_addressable()
  if not isinstance(x.sharding, SingleDeviceSharding):
    # Round trip via host if x is sharded. SDA also does a round trip via host.
    return dispatch._device_put_array(x._value, device)
  source_buffer = pxla._set_aval(x._arrays[0])
  copied = dispatch._copy_device_array_to_device(source_buffer, device)
  return (copied,)

dispatch.device_put_handlers[Array] = _device_put_array


def _array_pmap_shard_arg(x, devices, indices, mode):
  """Produces the per-device buffers of ``x`` for a pmap call.

  Single-device arrays are handed to ``pxla._shard_device_array``. For other
  arrays the existing buffers are reused (copied to the requested device where
  they are on a different one) when ``indices`` equals the indices of the
  array's own sharding; otherwise the slow path is taken.
  """
  if isinstance(x.sharding, SingleDeviceSharding):
    return pxla._shard_device_array(x, devices, indices, mode)

  # If the sharding of Array does not match pmap's sharding then take the slow
  # path which is similar to what SDA does. This slow path reroute only happens
  # for `pmap`.
  own_indices = tuple(x.sharding.devices_indices_map(x.shape).values())
  if indices == own_indices:
    placed = []
    for buf, target in safe_zip(x._arrays, devices):
      placed.append(buf if buf.device() == target else buf.copy_to_device(target))
    return placed
  return pxla._shard_sharded_device_array_slow_path(x, devices, indices, mode)


def _array_shard_arg(x, devices, indices, mode):
  """Shard-arg handler for ``Array``.

  In pmap mode the work is delegated to ``_array_pmap_shard_arg``; in every
  other mode the array's buffers are returned as they are.
  """
  return (_array_pmap_shard_arg(x, devices, indices, mode)
          if mode == pxla.InputsHandlerMode.pmap else x._arrays)
pxla.shard_arg_handlers[Array] = _array_shard_arg


def _array_global_result_handler(global_aval, out_sharding):
  """Returns a function that turns output buffers into a global ``Array``.

  Avals with a custom element type are handled by their dtype's
  ``global_sharded_result_handler``. Otherwise the returned function wraps the
  buffers in a committed ``Array`` without running the constructor checks.
  """
  if core.aval_has_custom_eltype(global_aval):
    return global_aval.dtype.global_sharded_result_handler(
        global_aval, out_sharding)

  def wrap_buffers(bufs):
    return Array(global_aval, out_sharding, bufs, committed=True,
                 _skip_checks=True)
  return wrap_buffers
pxla.global_result_handlers[(core.ShapedArray, pxla.OutputType.Array)] = _array_global_result_handler
pxla.global_result_handlers[(core.ConcreteArray, pxla.OutputType.Array)] = _array_global_result_handler


def _array_local_result_handler(aval, sharding, indices):
  """Returns a function that turns output buffers into an ``Array``.

  Avals with a custom element type are handled by their dtype's
  ``local_sharded_result_handler``. Otherwise ``indices`` is unused and the
  returned function wraps the buffers in a committed ``Array`` without running
  the constructor checks.
  """
  if core.aval_has_custom_eltype(aval):
    return aval.dtype.local_sharded_result_handler(aval, sharding, indices)

  def wrap_buffers(bufs):
    return Array(aval, sharding, bufs, committed=True, _skip_checks=True)
  return wrap_buffers
pxla.local_result_handlers[(core.ShapedArray, pxla.OutputType.Array)] = _array_local_result_handler
pxla.local_result_handlers[(core.ConcreteArray, pxla.OutputType.Array)] = _array_local_result_handler
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								# Copyright 2021 Google LLC
 								#
 								# Licensed under the Apache License, Version 2.0 (the "License");
 								# you may not use this file except in compliance with the License.
 								# You may obtain a copy of the License at
 								#
 								#     https://www.apache.org/licenses/LICENSE-2.0
 								#
 								# Unless required by applicable law or agreed to in writing, software
 								# distributed under the License is distributed on an "AS IS" BASIS,
 								# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 								# See the License for the specific language governing permissions and
 								# limitations under the License.
 								from __future__ import annotations
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								import operator as op
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								import numpy as np
-												Return `Array` from `jax.device_put` if `config.jax_array` is enabled.

PiperOrigin-RevId: 456531510

											
										
										
											2022-06-22 09:20:26 -07:00
+								from typing import Sequence, Tuple, Callable, Union, Optional, cast, List
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Add pjit support for `Array`. `Array` takes the same codepath as GDA so there are very little modifications to pjit. Add handlers aval, shard_args and result handlers for Array.

PiperOrigin-RevId: 454160854

											
										
										
											2022-06-10 07:31:43 -07:00
+								from jax import core
-												Array bug: make pytype_aval_mapping return a ConcreteShapedArray

											
										
										
											2022-08-18 12:31:30 -07:00
+								from jax._src import abstract_arrays
-												Make all pmap tests pass with Array! I am skipping all soft pmap tests for now.

PiperOrigin-RevId: 467264992

											
										
										
											2022-08-12 12:09:22 -07:00
+								from jax._src import ad_util
-												add an optional fastpath for api_util.shaped_abstractify

also add a benchmark for it, 8.7ms -> 0.2ms on my machine

Co-authored-by: Yash Katariya <yashkatariya@google.com>

											
										
										
											2022-07-27 10:54:54 -07:00
+								from jax._src import api_util
-												Make `jnp.array` return `jax.Array`. Add input and result handlers for `jax.Array`. Also added tests for `add` under jit.

TODO:
* Don't allow `x + y` if `jax.Array` is not fully addressable.
* Figure out how to use the already written tests with Array. Might be able to follow the path taken by SDA.
PiperOrigin-RevId: 457034779

											
										
										
											2022-06-24 10:04:31 -07:00
+								from jax._src import dispatch
-												Make checkify tests pass with Array and add methods on Array that are present on DA.

PiperOrigin-RevId: 468058909

											
										
										
											2022-08-16 16:51:26 -07:00
+								from jax._src import dtypes
-												Make all pmap tests pass with Array! I am skipping all soft pmap tests for now.

PiperOrigin-RevId: 467264992

											
										
										
											2022-08-12 12:09:22 -07:00
+								from jax._src.lax import lax as lax_internal
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								from jax._src.config import config
-												Pmap should output SDA like `Array`s to maintain the current behavior exactly. Split the shard_arg_handler for `Array` based on whether the mode is pmap or pjit. Why do this? The doc below explains more about the context.

PiperOrigin-RevId: 466849614

											
										
										
											2022-08-10 20:11:06 -07:00
+								from jax._src.util import prod, safe_zip
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								from jax._src.lib import xla_client as xc
 								from jax._src.api import device_put
-												Avoid import-time dependency on jax.experimental

											
										
										
											2022-08-19 11:30:25 -07:00
+								from jax._src.numpy.ndarray import ndarray
-												Make all pmap tests pass with Array! I am skipping all soft pmap tests for now.

PiperOrigin-RevId: 467264992

											
										
										
											2022-08-12 12:09:22 -07:00
+								from jax.interpreters import pxla, xla, mlir
-												Add pjit support for `Array`. `Array` takes the same codepath as GDA so there are very little modifications to pjit. Add handlers aval, shard_args and result handlers for Array.

PiperOrigin-RevId: 454160854

											
										
										
											2022-06-10 07:31:43 -07:00
+								from jax.experimental.sharding import (Sharding, SingleDeviceSharding,
-												Return `Array` from `jax.device_put` if `config.jax_array` is enabled.

PiperOrigin-RevId: 456531510

											
										
										
											2022-06-22 09:20:26 -07:00
+								                                       XLACompatibleSharding)
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
 								Shape = Tuple[int, ...]
 								Device = xc.Device
 								DeviceArray = xc.Buffer
 								Index = Tuple[slice, ...]
 								ArrayLike = Union[np.ndarray, DeviceArray]
-												Add the Shard class from GDA to `jax.Array` to make the management of shards easier and less verbose.

PiperOrigin-RevId: 453330349

											
										
										
											2022-06-06 18:44:45 -07:00
+								class Shard:
 								  """A single data shard of an Array.
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
+								  Attributes:
-												Add the Shard class from GDA to `jax.Array` to make the management of shards easier and less verbose.

PiperOrigin-RevId: 453330349

											
										
										
											2022-06-06 18:44:45 -07:00
+								    device : Which device this shard resides on.
 								    index : The index into the global array of this shard.
 								    replica_id : Integer id indicating which replica of the global array this
 								      shard is part of. Always 0 for fully sharded data
 								      (i.e. when there’s only 1 replica).
 								    data : The data of this shard. None if ``device`` is non-local.
 								  """
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
 								  def __init__(self, device: Device, sharding: Sharding, global_shape: Shape,
 								               data: Optional[Array] = None):
 								    self.device = device
 								    self._sharding = sharding
 								    self._global_shape = global_shape
 								    self.data = data
-												Add `__repr__` to Shard since its not a dataclass anymore

PiperOrigin-RevId: 456463979

											
										
										
											2022-06-22 02:25:34 -07:00
+								  def __repr__(self):
 								    try:
 								      return (f'Shard(device={repr(self.device)}, index={self.index}, '
 								              f'replica_id={self.replica_id}, data={self.data})')
 								    except ValueError:
 								      return f'Shard(device={repr(self.device)}, data={self.data})'
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
+								  @property
 								  def index(self) -> Index:
 								    try:
 								      device_indices_fn = self._sharding.device_indices
 								    except AttributeError:
 								      raise ValueError('Cannot calculate indices from sharding: '
 								                       f'{self._sharding}. Please create a device to index '
 								                       'mapping for your sharding.') from None
 								    index = device_indices_fn(self.device, self._global_shape)
 								    assert index is not None
 								    return index
 								  @property
 								  def replica_id(self) -> int:
 								    try:
 								      device_replica_id_fn = self._sharding.device_replica_id_map  # pytype: disable=attribute-error
 								    except AttributeError:
 								      raise ValueError('Cannot calculate replica ids from sharding: '
 								                       f'{self._sharding}. Please create a device to replica id '
 								                       'mapping for your sharding.') from None
 								    return device_replica_id_fn(self._global_shape)[self.device]
-												Add the Shard class from GDA to `jax.Array` to make the management of shards easier and less verbose.

PiperOrigin-RevId: 453330349

											
										
										
											2022-06-06 18:44:45 -07:00
-												Add support for interoperability via dlpack for Array and also make pickle_tests and lax_numpy_test pass with Array.

PiperOrigin-RevId: 468568917

											
										
										
											2022-08-18 15:58:40 -07:00
+								def _reconstruct_array(fun, args, arr_state, aval_state):
 								  """Method to reconstruct a device array from a serialized state."""
 								  np_value = fun(*args)
 								  np_value.__setstate__(arr_state)
 								  jnp_value = device_put(np_value)
 								  jnp_value.aval = jnp_value.aval.update(**aval_state)
 								  return jnp_value
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								class Array:
 								  # TODO(yashkatariya): Add __slots__ here.
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								  def __init__(self, aval: core.ShapedArray, sharding: Sharding,
-												Enable fast path in the Array constructor. This means that the rearranging of `_arrays` according to the device_assignment won't happen when fastpath is enabled because we assume that jax transformations will return the right arrangement.

PiperOrigin-RevId: 469492283

											
										
										
											2022-08-23 10:19:59 -07:00
+								               arrays: Union[Sequence[DeviceArray], Sequence[Array]],
 								               committed: bool, _skip_checks: bool = False):
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								    self.aval = aval
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								    self._sharding = sharding
-												Return `Array` from `jax.device_put` if `config.jax_array` is enabled.

PiperOrigin-RevId: 456531510

											
										
										
											2022-06-22 09:20:26 -07:00
+								    # Extract DeviceArrays from arrays with `SingleDeviceSharding` to keep the
 								    # code handling `self._arrays` simpler.
 								    # TODO(yashkatariya): This will be slower as it will happen during
 								    # `__init__` on single controller environment. Make it lazy.
 								    self._arrays: List[DeviceArray] = [a if isinstance(a, DeviceArray) else a._arrays[0]
 								                                       for a in arrays]
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								    # See https://jax.readthedocs.io/en/latest/faq.html#controlling-data-and-computation-placement-on-devices
 								    # for what committed means.
 								    self._committed = committed
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								    self._npy_value = None
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												`__repr__` if an Array is fully replicated. Its the same for `_value` so it makes sense to do the same for `__repr__`.

PiperOrigin-RevId: 469892350

											
										
										
											2022-08-24 20:41:48 -07:00
+								    # TODO(yashkatariya): Add a check here which checks if the expected shard
 								    # shape matches the shape of _arrays. A similar check exists for GDA.
 								    if not _skip_checks or config.jax_enable_checks:
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								      assert all(db.dtype == self.dtype for db in self._arrays), (
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								          "Input arrays to `Array` must have matching dtypes, "
-												Make eager pmap tests pass with `Array`. Also add a slow path for Array in `pmap` similar to what SDA has. This is required for eager pmap. Adding a slow path removes the need for doing sharding checks in api.py because SDA doesn't do those checks and if the sharding does not match with pmap sharding, then it just defaults to the slow path (exactly like SDA).

PiperOrigin-RevId: 468843310

											
										
										
											2022-08-19 21:36:43 -07:00
+								          f"got: {[db.dtype for db in self._arrays]}, aval type: {self.dtype}")
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Enable fast path in the Array constructor. This means that the rearranging of `_arrays` according to the device_assignment won't happen when fastpath is enabled because we assume that jax transformations will return the right arrangement.

PiperOrigin-RevId: 469492283

											
										
										
											2022-08-23 10:19:59 -07:00
+								    # Don't rearrange if skip_checks is enabled because this assumes that the
 								    # input buffers are already arranged properly. This usually happens when
 								    # Array's are created as output of a JAX transformation
 								    # (like pjit, xmap, etc).
 								    if not _skip_checks:
 								      addressable_device_assignment = self.sharding._addressable_device_assignment
 								      # Rearrange arrays based on the device assignment.
 								      if isinstance(sharding, XLACompatibleSharding):
 								        if len(self._arrays) != len(addressable_device_assignment):
 								          raise ValueError(
 								              f"Expected {len(addressable_device_assignment)} per-device arrays "
 								              "(this is how many devices are addressable by the sharding), but "
 								              f"got {len(self._arrays)}")
 								        device_to_buffer = {db.device().id: db for db in self._arrays}
 								        try:
 								          self._arrays = [device_to_buffer[device.id]
 								                          for device in addressable_device_assignment]
 								        except KeyError as e:
 								          array_device_ids = set(a.device().id for a in self._arrays)
 								          addressable_device_ids = set(d.id for d in addressable_device_assignment)
 								          diff = set(array_device_ids) - set(addressable_device_ids)
 								          raise ValueError(
 								              f"Some per-device arrays are placed on devices {diff}, which are "
 								              f"not used in the specified sharding {self.sharding}") from e
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
 								  @property
 								  def shape(self) -> Shape:
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								    return self.aval.shape
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Make `jnp.array` return `jax.Array`. Add input and result handlers for `jax.Array`. Also added tests for `add` under jit.

TODO:
* Don't allow `x + y` if `jax.Array` is not fully addressable.
* Figure out how to use the already written tests with Array. Might be able to follow the path taken by SDA.
PiperOrigin-RevId: 457034779

											
										
										
											2022-06-24 10:04:31 -07:00
+								  @property
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								  def dtype(self):
 								    return self.aval.dtype
-												Make `jnp.array` return `jax.Array`. Add input and result handlers for `jax.Array`. Also added tests for `add` under jit.

TODO:
* Don't allow `x + y` if `jax.Array` is not fully addressable.
* Figure out how to use the already written tests with Array. Might be able to follow the path taken by SDA.
PiperOrigin-RevId: 457034779

											
										
										
											2022-06-24 10:04:31 -07:00
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								  @property
 								  def ndim(self):
 								    """Return the number of dimensions, i.e. the length of ``self.shape``."""
 								    dims = self.shape
 								    return len(dims)
 								  @property
 								  def size(self):
 								    """Return the total element count: the product of the entries of ``shape``."""
 								    dims = self.shape
 								    return prod(dims)
 								  @property
 								  def sharding(self):
 								    """Return the sharding object stored on this array as ``_sharding``."""
 								    stored_sharding = self._sharding
 								    return stored_sharding
-												Make checkify tests pass with Array and add methods on Array that are present on DA.

PiperOrigin-RevId: 468058909

											
										
										
											2022-08-16 16:51:26 -07:00
+								  def __str__(self):
 								    return str(self._value)
 								  def __len__(self):
 								    """Return the size of the leading dimension.

 								    Raises:
 								      TypeError: if ``shape`` is empty (a 0-d array); the message matches
 								        the one NumPy uses.
 								    """
 								    try:
 								      leading_dim = self.shape[0]
 								    except IndexError as err:
 								      # same as numpy error
 								      raise TypeError("len() of unsized object") from err
 								    else:
 								      return leading_dim
 								  def __bool__(self):
 								    """Return the truth value of the host-side value ``self._value``."""
 								    host_value = self._value
 								    return bool(host_value)
 								  def __nonzero__(self):
 								    """Python 2 spelling of ``__bool__``: truth value of ``self._value``."""
 								    host_value = self._value
 								    return bool(host_value)
 								  def __float__(self):
 								    """Convert to a Python float by delegating to ``self._value.__float__()``."""
 								    host_value = self._value
 								    return host_value.__float__()
 								  def __int__(self):
 								    """Convert to a Python int by delegating to ``self._value.__int__()``."""
 								    host_value = self._value
 								    return host_value.__int__()
 								  def __complex__(self):
 								    """Convert to a Python complex via ``self._value.__complex__()``."""
 								    host_value = self._value
 								    return host_value.__complex__()
 								  def __hex__(self):
 								    """Return ``hex()`` of the host-side value; asserts the array is 0-d."""
 								    is_scalar = self.ndim == 0
 								    assert is_scalar, 'hex only works on scalar values'
 								    host_value = self._value
 								    return hex(host_value)  # type: ignore
 								  def __oct__(self):
 								    """Return ``oct()`` of the host-side value; asserts the array is 0-d."""
 								    is_scalar = self.ndim == 0
 								    assert is_scalar, 'oct only works on scalar values'
 								    host_value = self._value
 								    return oct(host_value)  # type: ignore
 								  def __index__(self):
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								    return op.index(self._value)
-												Make checkify tests pass with Array and add methods on Array that are present on DA.

PiperOrigin-RevId: 468058909

											
										
										
											2022-08-16 16:51:26 -07:00
-												Add support for interoperability via dlpack for Array and also make pickle_tests and lax_numpy_test pass with Array.

PiperOrigin-RevId: 468568917

											
										
										
											2022-08-18 15:58:40 -07:00
+								  def tobytes(self, order="C"):
-												Make checkify tests pass with Array and add methods on Array that are present on DA.

PiperOrigin-RevId: 468058909

											
										
										
											2022-08-16 16:51:26 -07:00
+								    return self._value.tobytes(order)
 								  def tolist(self):
 								    """Return the result of calling ``tolist()`` on ``self._value``."""
 								    host_value = self._value
 								    return host_value.tolist()
 								  def __format__(self, format_spec):
 								    """Format the host-side value with ``format_spec``.

 								    A 0-d array is first unwrapped with ``[()]`` so that the spec is applied
 								    to the scalar element rather than to the array object.
 								    """
 								    # Simulates behavior of https://github.com/numpy/numpy/pull/9883
 								    is_scalar = self.ndim == 0
 								    host_value = self._value
 								    target = host_value[()] if is_scalar else host_value
 								    return format(target, format_spec)
 								  def __iter__(self):
 								    """Iterate over slices along the leading axis.

 								    Slices are produced by taking chunks from ``self._chunk_iter(100)`` and
 								    yielding every element of each chunk's ``_unstack()``.

 								    Raises:
 								      TypeError: if the array is 0-d; the message matches NumPy's.
 								    """
 								    if self.ndim == 0:
 								      # same as numpy error
 								      raise TypeError("iteration over a 0-d array")
 								    # chunk_iter is added to Array in lax_numpy.py similar to DA.
 								    chunks = self._chunk_iter(100)  # type: ignore
 								    return (piece for block in chunks for piece in block._unstack())
 								  def item(self):
 								    """Convert the array to a Python scalar chosen by its dtype.

 								    Complex dtypes go through ``complex(self)``, floating dtypes through
 								    ``float(self)``, integer dtypes through ``int(self)`` and boolean dtypes
 								    through ``bool(self)``; the categories are tested in that order.

 								    Raises:
 								      TypeError: if the dtype falls in none of those categories.
 								    """
 								    converters = (
 								        (np.complexfloating, complex),
 								        (np.floating, float),
 								        (np.integer, int),
 								        (np.bool_, bool),
 								    )
 								    for category, convert in converters:
 								      if dtypes.issubdtype(self.dtype, category):
 								        return convert(self)
 								    raise TypeError(self.dtype)
-												`__repr__` if an Array is fully replicated. Its the same for `_value` so it makes sense to do the same for `__repr__`.

PiperOrigin-RevId: 469892350

											
										
										
											2022-08-24 20:41:48 -07:00
+								  def is_fully_replicated(self) -> bool:
 								    return self.shape == self._arrays[0].shape
-												Add `__repr__` to `Array`. It works exactly as it does for DA and SDA when it is fully addressable. Otherwise it works like GDA.

TODO is adding weak_type support in general and to `__repr__`.

PiperOrigin-RevId: 455680796

											
										
										
											2022-06-17 13:11:52 -07:00
+								  def __repr__(self):
 								    prefix = '{}('.format(self.__class__.__name__.lstrip('_'))
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								    if self.aval is not None and self.aval.weak_type:
 								      dtype_str = f'dtype={self.dtype.name}, weak_type=True)'
 								    else:
 								      dtype_str = f'dtype={self.dtype.name})'
-												Add `__repr__` to `Array`. It works exactly as it does for DA and SDA when it is fully addressable. Otherwise it works like GDA.

TODO is adding weak_type support in general and to `__repr__`.

PiperOrigin-RevId: 455680796

											
										
										
											2022-06-17 13:11:52 -07:00
-												`__repr__` if an Array is fully replicated. Its the same for `_value` so it makes sense to do the same for `__repr__`.

PiperOrigin-RevId: 469892350

											
										
										
											2022-08-24 20:41:48 -07:00
+								    if self.is_fully_addressable() or self.is_fully_replicated():
-												Add `__repr__` to `Array`. It works exactly as it does for DA and SDA when it is fully addressable. Otherwise it works like GDA.

TODO is adding weak_type support in general and to `__repr__`.

PiperOrigin-RevId: 455680796

											
										
										
											2022-06-17 13:11:52 -07:00
+								      line_width = np.get_printoptions()["linewidth"]
 								      s = np.array2string(self._value, prefix=prefix, suffix=',',
 								                          separator=', ', max_line_width=line_width)
 								      last_line_len = len(s) - s.rfind('\n') + 1
 								      sep = ' '
 								      if last_line_len + len(dtype_str) + 1 > line_width:
 								        sep = ' ' * len(prefix)
 								      return f"{prefix}{s},{sep}{dtype_str}"
 								    else:
-												Allow `to_py()` on Array if the sharding is fully replicated.

PiperOrigin-RevId: 469617855

											
										
										
											2022-08-23 19:48:59 -07:00
+								      return f"{prefix}{self.shape}, {dtype_str}"
-												Add `__repr__` to `Array`. It works exactly as it does for DA and SDA when it is fully addressable. Otherwise it works like GDA.

TODO is adding weak_type support in general and to `__repr__`.

PiperOrigin-RevId: 455680796

											
										
										
											2022-06-17 13:11:52 -07:00
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								  def is_fully_addressable(self) -> bool:
-												Make lower_mesh_computation accept sharding instances. The new path is tested as everything in pjit goes through the new `lower_sharding_computation` except of `AUTO` and `UNSPECIFIED` (see below for these 2).

* Split `lower_mesh_computation` into `lower_mesh_computation` and `lower_sharding_computation`. This is because `lower_mesh_computation` handles 3 paths; `spmd lowering path`, `non-spmd lowering path` and `xmap spmd lowering path`. I didn't want to add a 4th path to it for general shardings.
  * `lower_sharding_computation` works in SPMD mode since its only used in pjit. Majority of the logic is the same. The only difference is that `mesh` does not exist in this function.

* `MeshComputation` is the point where `lower_mesh_computation` and `lower_sharding_computation` merge.

* `AUTO` and `UNSPECIFIED` cannot be used without mesh right now but I have a CL to fix this.

* Rest of the changes are to make all other functions play nicely with sharding instances.

PiperOrigin-RevId: 461260553

											
										
										
											2022-07-15 16:12:42 -07:00
+								    return self.sharding.is_fully_addressable()
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Add context to `__array__` of Array just like DA.

PiperOrigin-RevId: 469874479

											
										
										
											2022-08-24 18:27:40 -07:00
+								  def __array__(self, dtype=None, context=None):
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								    return np.asarray(self._value, dtype=dtype)
-												Add support for interoperability via dlpack for Array and also make pickle_tests and lax_numpy_test pass with Array.

PiperOrigin-RevId: 468568917

											
										
										
											2022-08-18 15:58:40 -07:00
+								  def __dlpack__(self):
 								    from jax.dlpack import to_dlpack  # pylint: disable=g-import-not-at-top
 								    return to_dlpack(self)
 								  def __reduce__(self):
 								    """Pickle support: reuse the host value's reduction plus aval metadata.

 								    Returns a ``(_reconstruct_array, args)`` pair where ``args`` holds the
 								    three items from ``self._value.__reduce__()`` followed by a dict carrying
 								    the aval's ``weak_type`` and ``named_shape``.
 								    """
 								    fun, args, arr_state = self._value.__reduce__()
 								    aval = self.aval
 								    aval_state = dict(weak_type=aval.weak_type, named_shape=aval.named_shape)
 								    reconstruct_args = (fun, args, arr_state, aval_state)
 								    return (_reconstruct_array, reconstruct_args)
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								  # TODO(yashkatariya): Remove this method when everyone is using devices().
 								  def device(self) -> Device:
-												Add support for interoperability via dlpack for Array and also make pickle_tests and lax_numpy_test pass with Array.

PiperOrigin-RevId: 468568917

											
										
										
											2022-08-18 15:58:40 -07:00
+								    self._check_if_deleted()
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								    device_set = self.sharding.device_set
 								    if len(device_set) == 1:
 								      single_device, = device_set
 								      return single_device
 								    raise ValueError('Length of devices is greater than 1. '
 								                     'Please use `.devices()`.')
 								  def devices(self) -> List[Device]:
-												Add support for interoperability via dlpack for Array and also make pickle_tests and lax_numpy_test pass with Array.

PiperOrigin-RevId: 468568917

											
										
										
											2022-08-18 15:58:40 -07:00
+								    self._check_if_deleted()
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								    return list(self.sharding.device_set)
-												Add the Shard class from GDA to `jax.Array` to make the management of shards easier and less verbose.

PiperOrigin-RevId: 453330349

											
										
										
											2022-06-06 18:44:45 -07:00
+								  @pxla.maybe_cached_property
 								  def addressable_shards(self) -> Sequence[Shard]:
-												Fix the _check_if_deleted check that was merged at the wrong place by the cider merging machinery.

PiperOrigin-RevId: 454912448

											
										
										
											2022-06-14 11:23:07 -07:00
+								    self._check_if_deleted()
-												Add the Shard class from GDA to `jax.Array` to make the management of shards easier and less verbose.

PiperOrigin-RevId: 453330349

											
										
										
											2022-06-06 18:44:45 -07:00
+								    out = []
 								    for db in self._arrays:
 								      db = pxla._set_aval(db)
 								      device = db.device()
 								      # Wrap the device arrays in `Array` until C++ returns an Array instead
 								      # of a DA.
-												Enable fast path in the Array constructor. This means that the rearranging of `_arrays` according to the device_assignment won't happen when fastpath is enabled because we assume that jax transformations will return the right arrangement.

PiperOrigin-RevId: 469492283

											
										
										
											2022-08-23 10:19:59 -07:00
+								      array = Array(db.aval, SingleDeviceSharding(device), [db], committed=True,
 								                    _skip_checks=True)
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
+								      out.append(Shard(device, self.sharding, self.shape, array))
-												Add the Shard class from GDA to `jax.Array` to make the management of shards easier and less verbose.

PiperOrigin-RevId: 453330349

											
										
										
											2022-06-06 18:44:45 -07:00
+								    return out
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								  def delete(self):
 								    if self._arrays is None:
 								      return
 								    for buf in self._arrays:
 								      buf.delete()
 								    self._arrays = None
 								    self._npy_value = None
-												Add support for interoperability via dlpack for Array and also make pickle_tests and lax_numpy_test pass with Array.

PiperOrigin-RevId: 468568917

											
										
										
											2022-08-18 15:58:40 -07:00
+								  def is_deleted(self):
 								    return all(buf.is_deleted() for buf in self._arrays)
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								  def _check_if_deleted(self):
 								    if self._arrays is None:
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								      raise RuntimeError("Array has been deleted.")
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
 								  def block_until_ready(self):
 								    """Call ``block_until_ready()`` on every per-device buffer.

 								    ``_check_if_deleted()`` runs first, so a deleted array raises before any
 								    buffer is touched.

 								    Returns:
 								      ``self``, so the call can be chained.
 								    """
 								    self._check_if_deleted()
 								    for device_buffer in self._arrays:
 								      device_buffer.block_until_ready()
 								    return self
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								  def copy_to_host_async(self):
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								    self._check_if_deleted()
 								    if self._npy_value is None:
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
+								      try:
 								        self.addressable_shards[0].replica_id
 								        replica_id_exists = True
 								      except ValueError:
 								        replica_id_exists = False
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								      for s in self.addressable_shards:
-												Fix the _check_if_deleted check that was merged at the wrong place by the cider merging machinery.

PiperOrigin-RevId: 454912448

											
										
										
											2022-06-14 11:23:07 -07:00
+								        if not replica_id_exists or s.replica_id == 0:
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
+								          s.data._arrays[0].copy_to_host_async()  # pytype: disable=attribute-error
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								  @property
-												Adding `jax.Array` to jax.experimental. Its pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								  def _value(self) -> np.ndarray:
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								    self._check_if_deleted()
-												Allow `to_py()` on Array if the sharding is fully replicated.

PiperOrigin-RevId: 469617855

											
										
										
											2022-08-23 19:48:59 -07:00
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								    if self._npy_value is None:
-												`__repr__` if an Array is fully replicated. Its the same for `_value` so it makes sense to do the same for `__repr__`.

PiperOrigin-RevId: 469892350

											
										
										
											2022-08-24 20:41:48 -07:00
+								      if self.is_fully_replicated():
 								        self._npy_value = np.asarray(self._arrays[0])  # type: ignore
 								        return cast(np.ndarray, self._npy_value)
-												Allow `to_py()` on Array if the sharding is fully replicated.

PiperOrigin-RevId: 469617855

											
										
										
											2022-08-23 19:48:59 -07:00
 								      if not self.is_fully_addressable():
 								        raise RuntimeError("Fetching value for `jax.Array` that spans "
 								                           "non-addressable devices is not possible. You can use "
 								                           "`jax.experimental.multihost_utils.process_allgather` "
 								                           "for this use case.")
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								      self.copy_to_host_async()
 								      npy_value = np.empty(self.shape, self.dtype)
-												Make `Shard` a normal class making `index` and `replica_id` properties on that class. Raise an error if an indices cannot be calculated from a sharding.

PiperOrigin-RevId: 454899275

											
										
										
											2022-06-14 10:34:19 -07:00
 								      try:
 								        self.addressable_shards[0].replica_id
 								        replica_id_exists = True
 								      except ValueError:
 								        replica_id_exists = False
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								      for s in self.addressable_shards:
-												Fix the _check_if_deleted check that was merged at the wrong place by the cider merging machinery.

PiperOrigin-RevId: 454912448

											
										
										
											2022-06-14 11:23:07 -07:00
+								        if not replica_id_exists or s.replica_id == 0:
-												[JAX] Deprecate .to_py() property on arrays. Implement __array__ instead.

.to_py() was something of an accidental export from the JAX array classes. There are other mechanisms to turn a JAX array into a NumPy array, including `np.asarray(x)` and `jax.device_get(x)`. Deprecate this mechanism because it is redundant.

PiperOrigin-RevId: 469984029

											
										
										
											2022-08-25 07:27:54 -07:00
+								          npy_value[s.index] = np.asarray(s.data._arrays[0])  # type: ignore  # [union-attr]
-												Add `__array__` (for device_get), `_npy_value`, `block_until_ready`, `delete` and `_check_if_deleted` to Array.

PiperOrigin-RevId: 454741685

											
										
										
											2022-06-13 18:07:55 -07:00
+								      self._npy_value = npy_value  # type: ignore
 								    # https://docs.python.org/3/library/typing.html#typing.cast
 								    return cast(np.ndarray, self._npy_value)
-												Adding `jax.Array` to jax.experimental. It's pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								# explicitly set to be unhashable. Same as what device_array.py does.
 								setattr(Array, "__hash__", None)
-												Adding `jax.Array` to jax.experimental. It's pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
 								def make_array_from_callback(shape: Shape, sharding: Sharding,
 								                             data_callback: Callable[[Optional[Index]], ArrayLike]) -> Array:
-												Return `Array` from `jax.device_put` if `config.jax_array` is enabled.

PiperOrigin-RevId: 456531510

											
										
										
											2022-06-22 09:20:26 -07:00
+								  arrays = [
-												Adding `jax.Array` to jax.experimental. It's pretty much the same as GDA (without the performance optimization for now).

Currently, jax.Array takes DeviceArrays in `assemble_array` because device_put returns a DA. In the future (with IFRT), it will return an `Array`.

`addressable_shards` wraps DA into jax.Array with a `SingleDeviceSharding`.

PiperOrigin-RevId: 453319811

											
										
										
											2022-06-06 17:31:20 -07:00
+								      device_put(data_callback(sharding.device_indices(device, shape)), device)
 								      for device in sharding.addressable_devices
 								  ]
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								  aval = core.ShapedArray(shape, arrays[0].dtype, weak_type=False)
 								  return Array(aval, sharding, arrays, committed=True)
-												Add pjit support for `Array`. `Array` takes the same codepath as GDA so there are very few modifications to pjit. Add aval, shard_args and result handlers for Array.

PiperOrigin-RevId: 454160854

											
										
										
											2022-06-10 07:31:43 -07:00
-												Array bug: make pytype_aval_mapping return a ConcreteShapedArray

											
										
										
											2022-08-18 12:31:30 -07:00
+								core.pytype_aval_mappings[Array] = abstract_arrays.canonical_concrete_aval
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								xla.pytype_aval_mappings[Array] = op.attrgetter('aval')
-												Add pjit support for `Array`. `Array` takes the same codepath as GDA so there are very few modifications to pjit. Add aval, shard_args and result handlers for Array.

PiperOrigin-RevId: 454160854

											
										
										
											2022-06-10 07:31:43 -07:00
+								xla.canonicalize_dtype_handlers[Array] = pxla.identity
-												Add weak type support to Array. Also make all api_test.py tests pass with Array. I have disabled the `float0` test for now until I investigate.

PiperOrigin-RevId: 468264910

											
										
										
											2022-08-17 12:25:14 -07:00
+								api_util._shaped_abstractify_handlers[Array] = op.attrgetter('aval')
-												Make all pmap tests pass with Array! I am skipping all soft pmap tests for now.

PiperOrigin-RevId: 467264992

											
										
										
											2022-08-12 12:09:22 -07:00
+								ad_util.jaxval_adders[Array] = lax_internal.add
 								ad_util.jaxval_zeros_likers[Array] = lax_internal.zeros_like_array
-												Avoid import-time dependency on jax.experimental

											
										
										
											2022-08-19 11:30:25 -07:00
+								ndarray.register(Array)
-												Make all pmap tests pass with Array! I am skipping all soft pmap tests for now.

PiperOrigin-RevId: 467264992

											
										
										
											2022-08-12 12:09:22 -07:00
 								def _array_mlir_constant_handler(val, canonicalize_types=True):
 								  """Constant handler for `Array`: delegates to `mlir.ir_constants` on `val._value`.
 								  Args:
 								    val: the object to handle; this handler is registered for `Array` below.
 								      NOTE(review): `val._value` is presumably the host NumPy copy of the
 								      array -- confirm against the `_value` definition.
 								    canonicalize_types: forwarded unchanged to `mlir.ir_constants`.
 								  Returns:
 								    Whatever `mlir.ir_constants` returns for `val._value`.
 								  """
 								  return mlir.ir_constants(val._value,
 								                           canonicalize_types=canonicalize_types)
 								# Register the handler above for the `Array` type.
 								mlir.register_constant_handler(Array, _array_mlir_constant_handler)
-												Add pjit support for `Array`. `Array` takes the same codepath as GDA so there are very few modifications to pjit. Add aval, shard_args and result handlers for Array.

PiperOrigin-RevId: 454160854

											
										
										
											2022-06-10 07:31:43 -07:00
-												Make `jnp.array` return `jax.Array`. Add input and result handlers for `jax.Array`. Also added tests for `add` under jit.

TODO:
* Don't allow `x + y` if `jax.Array` is not fully addressable.
* Figure out how to use the already written tests with Array. Might be able to follow the path taken by SDA.
PiperOrigin-RevId: 457034779

											
										
										
											2022-06-24 10:04:31 -07:00
 								def _device_put_array(x, device: Optional[Device]):
-												Make `astype` work for `Array` that are sharded. The current behavior is the same as SDA i.e. it round trips via host.

PiperOrigin-RevId: 457797458

											
										
										
											2022-06-28 12:48:39 -07:00
+								  # TODO(yashkatariya): Remove this restriction and the round trip via host
 								  # once lowering to XLA goes through `lower_mesh_computation`.
 								  assert x.is_fully_addressable()
 								  if isinstance(x.sharding, SingleDeviceSharding):
 								    x = dispatch._copy_device_array_to_device(pxla._set_aval(x._arrays[0]), device)
 								    return (x,)
 								  else:
 								    # Round trip via host if x is sharded. SDA also does a round trip via host.
 								    return dispatch._device_put_array(x._value, device)
-												Make `jnp.array` return `jax.Array`. Add input and result handlers for `jax.Array`. Also added tests for `add` under jit.

TODO:
* Don't allow `x + y` if `jax.Array` is not fully addressable.
* Figure out how to use the already written tests with Array. Might be able to follow the path taken by SDA.
PiperOrigin-RevId: 457034779

											
										
										
											2022-06-24 10:04:31 -07:00
+								dispatch.device_put_handlers[Array] = _device_put_array
-												Make eager pmap tests pass with `Array`. Also add a slow path for Array in `pmap` similar to what SDA has. This is required for eager pmap. Adding a slow path removes the need for doing sharding checks in api.py because SDA doesn't do those checks and if the sharding does not match with pmap sharding, then it just defaults to the slow path (exactly like SDA).

PiperOrigin-RevId: 468843310

											
										
										
											2022-08-19 21:36:43 -07:00
+								def _array_pmap_shard_arg(x, devices, indices, mode):
 								  if isinstance(x.sharding, SingleDeviceSharding):
 								    return pxla._shard_device_array(x, devices, indices, mode)
 								  # If the sharding of Array does not match pmap's sharding then take the slow
 								  # path which is similar to what SDA does. This slow path reroute only happens
 								  # for `pmap`.
 								  if indices == tuple(x.sharding.devices_indices_map(x.shape).values()):
-												Pmap should output SDA like `Array`s to maintain the current behavior exactly. Split the shard_arg_handler for `Array` based on whether the mode is pmap or pjit. Why do this? The doc below explains more about the context.

PiperOrigin-RevId: 466849614

											
										
										
											2022-08-10 20:11:06 -07:00
+								    return [buf if buf.device() == d else buf.copy_to_device(d)
 								            for buf, d in safe_zip(x._arrays, devices)]
-												Make eager pmap tests pass with `Array`. Also add a slow path for Array in `pmap` similar to what SDA has. This is required for eager pmap. Adding a slow path removes the need for doing sharding checks in api.py because SDA doesn't do those checks and if the sharding does not match with pmap sharding, then it just defaults to the slow path (exactly like SDA).

PiperOrigin-RevId: 468843310

											
										
										
											2022-08-19 21:36:43 -07:00
+								  else:
 								    return pxla._shard_sharded_device_array_slow_path(x, devices, indices, mode)
 								def _array_shard_arg(x, devices, indices, mode):
 								  if mode == pxla.InputsHandlerMode.pmap:
 								    return _array_pmap_shard_arg(x, devices, indices, mode)
-												Pmap should output SDA like `Array`s to maintain the current behavior exactly. Split the shard_arg_handler for `Array` based on whether the mode is pmap or pjit. Why do this? The doc below explains more about the context.

PiperOrigin-RevId: 466849614

											
										
										
											2022-08-10 20:11:06 -07:00
+								  else:
 								    return x._arrays
-												Add pjit support for `Array`. `Array` takes the same codepath as GDA so there are very few modifications to pjit. Add aval, shard_args and result handlers for Array.

PiperOrigin-RevId: 454160854

											
										
										
											2022-06-10 07:31:43 -07:00
+								pxla.shard_arg_handlers[Array] = _array_shard_arg
-												Pmap should output SDA like `Array`s to maintain the current behavior exactly. Split the shard_arg_handler for `Array` based on whether the mode is pmap or pjit. Why do this? The doc below explains more about the context.

PiperOrigin-RevId: 466849614

											
										
										
											2022-08-10 20:11:06 -07:00
+								def _array_global_result_handler(global_aval, out_sharding):
-												support `jax.experimental.array.Array` as a base array for key arrays

Only handle host-locally sharded `Array`s for now (like in SDAs under
`pmap`). Leaving global sharding for a follow up.

Also re-enable a previously skipped test as a result.

Co-authored-by: Yash Katariya <yashkatariya@google.com>
PiperOrigin-RevId: 469885160

											
										
										
											2022-08-24 19:48:36 -07:00
+								  if core.aval_has_custom_eltype(global_aval):
 								    return global_aval.dtype.global_sharded_result_handler(
 								        global_aval, out_sharding)
 								  else:
 								    return lambda bufs: Array(global_aval, out_sharding, bufs, committed=True,
 								                              _skip_checks=True)
-												Pmap should output SDA like `Array`s to maintain the current behavior exactly. Split the shard_arg_handler for `Array` based on whether the mode is pmap or pjit. Why do this? The doc below explains more about the context.

PiperOrigin-RevId: 466849614

											
										
										
											2022-08-10 20:11:06 -07:00
+								pxla.global_result_handlers[(core.ShapedArray, pxla.OutputType.Array)] = _array_global_result_handler
 								pxla.global_result_handlers[(core.ConcreteArray, pxla.OutputType.Array)] = _array_global_result_handler
 								def _array_local_result_handler(aval, sharding, indices):
-												support `jax.experimental.array.Array` as a base array for key arrays

Only handle host-locally sharded `Array`s for now (like in SDAs under
`pmap`). Leaving global sharding for a follow up.

Also re-enable a previously skipped test as a result.

Co-authored-by: Yash Katariya <yashkatariya@google.com>
PiperOrigin-RevId: 469885160

											
										
										
											2022-08-24 19:48:36 -07:00
+								  if core.aval_has_custom_eltype(aval):
 								    return aval.dtype.local_sharded_result_handler(aval, sharding, indices)
 								  else:
 								    return lambda bufs: Array(aval, sharding, bufs, committed=True,
 								                              _skip_checks=True)
-												Pmap should output SDA like `Array`s to maintain the current behavior exactly. Split the shard_arg_handler for `Array` based on whether the mode is pmap or pjit. Why do this? The doc below explains more about the context.

PiperOrigin-RevId: 466849614

											
										
										
											2022-08-10 20:11:06 -07:00
+								pxla.local_result_handlers[(core.ShapedArray, pxla.OutputType.Array)] = _array_local_result_handler
 								pxla.local_result_handlers[(core.ConcreteArray, pxla.OutputType.Array)] = _array_local_result_handler