NeelNanda's picture
Made compatible with Python 3.8
c46567d
# Copyright 2022 DeepMind Technologies Limited. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Vectors and bases."""
import dataclasses
from typing import Sequence, Union, Optional, Iterable
import numpy as np
Name = Union[int, str]
Value = Union[int, float, bool, str, tuple]
@dataclasses.dataclass(frozen=True)
class BasisDirection:
"""Represents a basis direction (no magnitude) in a vector space.
Attributes:
name: a unique name for this direction.
value: used to hold a value one-hot-encoded by this direction. e.g.,
[BasisDirection("vs_1", True), BasisDirection("vs_1", False)] would be
basis directions of a subspace called "vs_1" which one-hot-encodes the
values True and False. If provided, considered part of the name for the
purpose of disambiguating directions.
"""
name: Name
value: Optional[Value] = None
def __str__(self):
if self.value is None:
return str(self.name)
return f"{self.name}:{self.value}"
def __lt__(self, other: "BasisDirection") -> bool:
try:
return (self.name, self.value) < (other.name, other.value)
except TypeError:
return str(self) < str(other)
@dataclasses.dataclass
class VectorInBasis:
"""A vector (or array of vectors) in a given basis.
When magnitudes are 1-d, this is a vector.
When magnitudes are (n+1)-d, this is an array of vectors,
where the -1th dimension is the basis dimension.
"""
basis_directions: Sequence[BasisDirection]
magnitudes: np.ndarray
def __post_init__(self):
"""Sort basis directions."""
if len(self.basis_directions) != self.magnitudes.shape[-1]:
raise ValueError(
"Last dimension of magnitudes must be the same as number "
f"of basis directions. Was {len(self.basis_directions)} "
f"and {self.magnitudes.shape[-1]}.")
sort_idx = np.argsort(self.basis_directions)
self.basis_directions = [self.basis_directions[i] for i in sort_idx]
self.magnitudes = np.take(self.magnitudes, sort_idx, -1)
def __add__(self, other: "VectorInBasis") -> "VectorInBasis":
if self.basis_directions != other.basis_directions:
raise TypeError(f"Adding incompatible bases: {self} + {other}")
magnitudes = self.magnitudes + other.magnitudes
return VectorInBasis(self.basis_directions, magnitudes)
def __radd__(self, other: "VectorInBasis") -> "VectorInBasis":
if self.basis_directions != other.basis_directions:
raise TypeError(f"Adding incompatible bases: {other} + {self}")
return self + other
def __sub__(self, other: "VectorInBasis") -> "VectorInBasis":
if self.basis_directions != other.basis_directions:
raise TypeError(f"Subtracting incompatible bases: {self} - {other}")
magnitudes = self.magnitudes - other.magnitudes
return VectorInBasis(self.basis_directions, magnitudes)
def __rsub__(self, other: "VectorInBasis") -> "VectorInBasis":
if self.basis_directions != other.basis_directions:
raise TypeError(f"Subtracting incompatible bases: {other} - {self}")
magnitudes = other.magnitudes - self.magnitudes
return VectorInBasis(self.basis_directions, magnitudes)
def __mul__(self, scalar: float) -> "VectorInBasis":
return VectorInBasis(self.basis_directions, self.magnitudes * scalar)
def __rmul__(self, scalar: float) -> "VectorInBasis":
return self * scalar
def __truediv__(self, scalar: float) -> "VectorInBasis":
return VectorInBasis(self.basis_directions, self.magnitudes / scalar)
def __neg__(self) -> "VectorInBasis":
return (-1) * self
def __eq__(self, other: "VectorInBasis") -> bool:
return ((self.basis_directions == other.basis_directions) and
(self.magnitudes.shape == other.magnitudes.shape) and
(np.all(self.magnitudes == other.magnitudes)))
@classmethod
def sum(cls, vectors: Sequence["VectorInBasis"]) -> "VectorInBasis":
return cls(vectors[0].basis_directions,
np.sum([x.magnitudes for x in vectors], axis=0))
@classmethod
def stack(cls,
vectors: Sequence["VectorInBasis"],
axis: int = 0) -> "VectorInBasis":
for v in vectors[1:]:
if v.basis_directions != vectors[0].basis_directions:
raise TypeError(f"Stacking incompatible bases: {vectors[0]} + {v}")
return cls(vectors[0].basis_directions,
np.stack([v.magnitudes for v in vectors], axis=axis))
def project(
self, basis: Union["VectorSpaceWithBasis", Sequence[BasisDirection]]
) -> "VectorInBasis":
"""Projects to the basis."""
if isinstance(basis, VectorSpaceWithBasis):
basis = basis.basis
components = []
for direction in basis:
if direction in self.basis_directions:
components.append(
self.magnitudes[..., self.basis_directions.index(direction)])
else:
components.append(np.zeros_like(self.magnitudes[..., 0]))
return VectorInBasis(list(basis), np.stack(components, axis=-1))
@dataclasses.dataclass
class VectorSpaceWithBasis:
"""A vector subspace in a given basis."""
basis: Sequence[BasisDirection]
def __post_init__(self):
"""Keep basis directions sorted."""
self.basis = sorted(self.basis)
@property
def num_dims(self) -> int:
return len(self.basis)
def __contains__(self, item: Union[VectorInBasis, BasisDirection]) -> bool:
if isinstance(item, BasisDirection):
return item in self.basis
return set(self.basis) == set(item.basis_directions)
def issubspace(self, other: "VectorSpaceWithBasis") -> bool:
return set(self.basis).issubset(set(other.basis))
def basis_vectors(self) -> Sequence[VectorInBasis]:
basis_vector_magnitudes = list(np.eye(self.num_dims))
return [VectorInBasis(self.basis, m) for m in basis_vector_magnitudes]
def vector_from_basis_direction(
self, basis_direction: BasisDirection) -> VectorInBasis:
i = self.basis.index(basis_direction)
return VectorInBasis(self.basis, np.eye(self.num_dims)[i])
def null_vector(self) -> VectorInBasis:
return VectorInBasis(self.basis, np.zeros(self.num_dims))
@classmethod
def from_names(cls, names: Sequence[Name]) -> "VectorSpaceWithBasis":
"""Creates a VectorSpace from a list of names for its basis directions."""
return cls([BasisDirection(n) for n in names])
@classmethod
def from_values(
cls,
name: Name,
values: Iterable[Value],
) -> "VectorSpaceWithBasis":
"""Creates a VectorSpace from a list of values for its basis directions."""
return cls([BasisDirection(name, v) for v in values])
def direct_sum(*vs: VectorSpaceWithBasis) -> VectorSpaceWithBasis:
"""Create a direct sum of the vector spaces.
Assumes the basis elements of all input vector spaces are
orthogonal to each other. Maintains the order of the bases.
Args:
*vs: the vector spaces to sum.
Returns:
the combined vector space.
Raises:
Value error in case of overlapping bases.
"""
# Take the union of all the bases:
total_basis = sum([v.basis for v in vs], [])
if len(total_basis) != len(set(total_basis)):
raise ValueError("Overlapping bases!")
return VectorSpaceWithBasis(total_basis)
def join_vector_spaces(*vs: VectorSpaceWithBasis) -> VectorSpaceWithBasis:
"""Joins a set of vector spaces allowing them to overlap.
Assumes the basis elements of all input vector spaces are
orthogonal to each other. Does not maintain the order of the bases but
sorts them.
Args:
*vs: the vector spaces to sum.
Returns:
the combined vector space.
"""
# Take the union of all the bases:
total_basis = list(set().union(*[set(v.basis) for v in vs]))
total_basis = sorted(total_basis)
return VectorSpaceWithBasis(total_basis)
def ensure_dims(
vs: VectorSpaceWithBasis,
num_dims: int,
name: str = "vector space",
) -> None:
"""Raises ValueError if vs has the wrong number of dimensions."""
if vs.num_dims != num_dims:
raise ValueError(f"{name} must have num_dims={num_dims}, "
f"but got {vs.num_dims}: {vs.basis}")