declearn.model.torch.TorchVector

Bases: Vector

Vector subclass to store PyTorch tensors.

This Vector is designed to store a collection of named PyTorch tensors, enabling computations that are applied either to each individual coefficient or between two sets of aligned coefficients (i.e. two TorchVector instances with similar specifications).

Use vector.coefs to access the stored coefficients.
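
For instance, a minimal construction sketch (tensor names, shapes and values below are arbitrary placeholders):

import torch

from declearn.model.torch import TorchVector

# Wrap a collection of named tensors; access them back through 'coefs'.
vector = TorchVector({"kernel": torch.ones((2, 3)), "bias": torch.zeros(3)})
print(vector.coefs["bias"])  # tensor([0., 0., 0.])
print(vector.shapes())       # {'kernel': (2, 3), 'bias': (3,)}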

Notes

  • A TorchVector can be operated with either:
    • a scalar value,
    • a NumpyVector that has similar specifications, or
    • a TorchVector that has similar specifications,
    resulting in a TorchVector in each of these cases (a short usage sketch follows these notes).
  • The wrapped tensors may be placed on any device (CPU, GPU...) and need not all be on the same device.
  • The device-placement of the initial TorchVector's data is preserved by operations, including those involving a NumpyVector.
  • When combining two TorchVector instances, the device-placement of the left-most one is used; hence gpu + cpu = gpu while cpu + gpu = cpu. In both cases, a warning is emitted so that the implied cross-device copy does not go unnoticed.
  • When deserializing a TorchVector (either directly via TorchVector.unpack or when loading one from a JSON dump), tensors are placed according to the global device-placement policy (accessed via declearn.utils.get_device_policy). The restored vector may therefore have a different device-placement schema than at dump time, but one that is coherent with that of TorchModel computations.
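
To make these behaviours concrete, here is a minimal usage sketch (assuming declearn and torch are installed; the import path of NumpyVector and all names and values are illustrative assumptions, not part of this page):

import numpy as np
import torch

from declearn.model.sklearn import NumpyVector
from declearn.model.torch import TorchVector

# A TorchVector wrapping two named tensors.
t_vec = TorchVector({
    "kernel": torch.ones((2, 3)),
    "bias": torch.zeros(3),
})

# Operation with a scalar value -> TorchVector.
scaled = t_vec * 2.0

# Operation with a NumpyVector sharing names, shapes and dtypes -> TorchVector.
n_vec = NumpyVector({
    "kernel": np.full((2, 3), 0.5, dtype="float32"),
    "bias": np.ones(3, dtype="float32"),
})
shifted = t_vec + n_vec

# Operation with another TorchVector -> TorchVector. If the operands were on
# distinct devices, the left-most one's placement would be kept and a warning
# would signal the implied cross-device copy.
summed = scaled + shifted

print({key: val.shape for key, val in summed.coefs.items()})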
Source code in declearn/model/torch/_vector.py
@register_vector_type(torch.Tensor)
class TorchVector(Vector):
    """Vector subclass to store PyTorch tensors.

    This Vector is designed to store a collection of named PyTorch
    tensors, enabling computations that are either applied to each
    and every coefficient, or imply two sets of aligned coefficients
    (i.e. two TorchVector with similar specifications).

    Use `vector.coefs` to access the stored coefficients.

    Notes
    -----
    - A `TorchVector` can be operated with either a:
        - scalar value
        - `NumpyVector` that has similar specifications
        - `TorchVector` that has similar specifications
        - => resulting in a `TorchVector` in each of these cases.
    - The wrapped tensors may be placed on any device (CPU, GPU...)
      and may not be all on the same device.
    - The device-placement of the initial `TorchVector`'s data
      is preserved by operations, including with `NumpyVector`.
    - When combining two `TorchVector`, the device-placement
      of the left-most one is used; in that case, one ends up with
      `gpu + cpu = gpu` while `cpu + gpu = cpu`. In both cases, a
      warning will be emitted to prevent silent un-optimized copies.
    - When deserializing a `TorchVector` (either by directly using
      `TorchVector.unpack` or loading one from a JSON dump), loaded
      tensors are placed based on the global device-placement policy
      (accessed via `declearn.utils.get_device_policy`). Thus it may
      have a different device-placement schema than at dump time but
      should be coherent with that of `TorchModel` computations.
    """

    @property
    def _op_add(self) -> Callable[[Any, Any], Any]:
        return torch.add

    @property
    def _op_sub(self) -> Callable[[Any, Any], Any]:
        return torch.sub

    @property
    def _op_mul(self) -> Callable[[Any, Any], Any]:
        return torch.mul

    @property
    def _op_div(self) -> Callable[[Any, Any], Any]:
        return torch.div

    @property
    def _op_pow(self) -> Callable[[Any, Any], Any]:
        return torch.pow

    @property
    def compatible_vector_types(self) -> Set[Type[Vector]]:
        types = super().compatible_vector_types
        return types.union({NumpyVector, TorchVector})

    def __init__(self, coefs: Dict[str, torch.Tensor]) -> None:
        super().__init__(coefs)

    def _apply_operation(
        self,
        other: Any,
        func: Callable[[Any, Any], Any],
    ) -> Self:
        # Convert 'other' NumpyVector to a (CPU-backed) TorchVector.
        if isinstance(other, NumpyVector):
            coefs = {
                key: torch.from_numpy(val) for key, val in other.coefs.items()
            }
            other = TorchVector(coefs)
        # Ensure 'other' TorchVector shares this vector's device placement.
        if isinstance(other, TorchVector):
            coefs = {
                key: val.to(self.coefs[key].device)
                for key, val in other.coefs.items()
            }
            other = TorchVector(coefs)
        return super()._apply_operation(other, func)

    def dtypes(
        self,
    ) -> Dict[str, str]:
        dtypes = super().dtypes()
        return {key: val.split(".", 1)[-1] for key, val in dtypes.items()}

    def shapes(
        self,
    ) -> Dict[str, Tuple[int, ...]]:
        return {key: tuple(coef.shape) for key, coef in self.coefs.items()}

    def pack(
        self,
    ) -> Dict[str, Any]:
        return {
            key: np.array(tns.cpu().numpy()) for key, tns in self.coefs.items()
        }

    @classmethod
    def unpack(
        cls,
        data: Dict[str, Any],
    ) -> Self:
        policy = get_device_policy()
        device = select_device(gpu=policy.gpu, idx=policy.idx)
        coefs = {
            key: torch.from_numpy(dat).to(device) for key, dat in data.items()
        }
        return cls(coefs)

    def __eq__(
        self,
        other: Any,
    ) -> bool:
        valid = isinstance(other, TorchVector)
        if valid:
            valid = self.coefs.keys() == other.coefs.keys()
        if valid:
            valid = all(
                # false-positive on 'torch.equal'; pylint: disable=no-member
                torch.equal(tns, other.coefs[key].to(tns.device))
                for key, tns in self.coefs.items()
            )
        return valid

    def sign(self) -> Self:
        return self.apply_func(torch.sign)

    def minimum(
        self,
        other: Union[Self, float],
    ) -> Self:
        if isinstance(other, Vector):
            return self._apply_operation(other, torch.minimum)
        if isinstance(other, float):
            return self._operate_with_float(torch.minimum, other)
        raise TypeError(  # pragma: no cover
            f"Unsupported input type to '{self.__class__.__name__}.minimum'."
        )

    def maximum(
        self,
        other: Union[Self, float],
    ) -> Self:
        if isinstance(other, Vector):
            return self._apply_operation(other, torch.maximum)
        if isinstance(other, float):
            return self._operate_with_float(torch.maximum, other)
        raise TypeError(  # pragma: no cover
            f"Unsupported input type to '{self.__class__.__name__}.maximum'."
        )

    def _operate_with_float(
        self,
        func: Callable[[torch.Tensor, torch.Tensor], torch.Tensor],
        other: float,
    ) -> Self:
        """Apply an operation on coefficients with a single float.

        Handle tensor-conversion and device-placement issues that are
        specific to (some) Torch (functions).
        """
        # Create Tensors wrapping the scalar on each required device.
        device_other = {
            device: torch.Tensor([other]).to(device)
            for device in {val.device for val in self.coefs.values()}
        }
        # Apply the function to coefficients and re-wrap as a TorchVector.
        coefs = {
            key: func(val, device_other[val.device])
            for key, val in self.coefs.items()
        }
        return self.__class__(coefs)

    def sum(
        self,
    ) -> Self:
        coefs = {key: val.sum() for key, val in self.coefs.items()}
        return self.__class__(coefs)

    def flatten(
        self,
    ) -> Tuple[List[float], VectorSpec]:
        v_spec = self.get_vector_specs()
        arrays = self.pack()
        values = flatten_numpy_arrays([arrays[name] for name in v_spec.names])
        return values, v_spec

    @classmethod
    def unflatten(
        cls,
        values: List[float],
        v_spec: VectorSpec,
    ) -> Self:
        shapes = [v_spec.shapes[name] for name in v_spec.names]
        dtypes = [v_spec.dtypes[name] for name in v_spec.names]
        arrays = unflatten_numpy_arrays(values, shapes, dtypes)
        return cls.unpack(dict(zip(v_spec.names, arrays)))
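
As a complement, a short sketch of the pack / unpack round-trip implemented above (a minimal illustration, not part of the library's documentation; the device placement of the restored tensors follows the global policy rather than the placement at dump time):

import torch

from declearn.model.torch import TorchVector
from declearn.utils import get_device_policy

vec = TorchVector({"weights": torch.randn(4, 2)})

# 'pack' exports the coefficients as named (CPU-backed) numpy arrays.
packed = vec.pack()

# 'unpack' rebuilds a TorchVector, placing tensors according to the
# global device-placement policy rather than their placement at dump time.
restored = TorchVector.unpack(packed)
print(get_device_policy())
print({key: val.device for key, val in restored.coefs.items()})
assert restored == vec  # equality testing handles cross-device comparison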