mctigger
diff --git a/‎README.md‎
Lines changed: 2 additions & 2 deletions b/‎README.md‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎docs/tensor_container.md‎
Lines changed: 308 additions & 0 deletions b/‎docs/tensor_container.md‎
Lines changed: 308 additions & 0 deletions
diff --git a/‎docs/tensor_distribution/development.md‎
Lines changed: 4 additions & 3 deletions b/‎docs/tensor_distribution/development.md‎
Lines changed: 4 additions & 3 deletions
diff --git a/‎src/tensorcontainer/distributions/__init__.py‎
Lines changed: 3 additions & 0 deletions b/‎src/tensorcontainer/distributions/__init__.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎src/tensorcontainer/distributions/symlog.py‎
Lines changed: 132 additions & 0 deletions b/‎src/tensorcontainer/distributions/symlog.py‎
Lines changed: 132 additions & 0 deletions
diff --git a/‎src/tensorcontainer/distributions/truncated_normal.py‎
Lines changed: 1 addition & 1 deletion b/‎src/tensorcontainer/distributions/truncated_normal.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/tensorcontainer/tensor_annotated.py‎
Lines changed: 3 additions & 7 deletions b/‎src/tensorcontainer/tensor_annotated.py‎
Lines changed: 3 additions & 7 deletions
diff --git a/‎src/tensorcontainer/tensor_container.py‎
Lines changed: 12 additions & 24 deletions b/‎src/tensorcontainer/tensor_container.py‎
Lines changed: 12 additions & 24 deletions
diff --git a/‎src/tensorcontainer/tensor_dataclass.py‎
Lines changed: 5 additions & 4 deletions b/‎src/tensorcontainer/tensor_dataclass.py‎
Lines changed: 5 additions & 4 deletions
@@ -2,9 +2,9 @@
 
 *Tensor containers for PyTorch with PyTree compatibility and torch.compile optimization*
 
-[![Python 3.9+](https://img.shields.io/badge/python-3.9+-blue.svg)](https://www.python.org/downloads/)
+[![Python 3.9, 3.10, 3.11, 3.12](https://img.shields.io/badge/python-3.9%20%7C%203.10%20%7C%203.11%20%7C%203.12-blue)](https://www.python.org/downloads/)
 [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
-[![PyTorch](https://img.shields.io/badge/PyTorch-2.0+-red.svg)](https://pytorch.org/)
+[![PyTorch](https://img.shields.io/badge/PyTorch-2.6+-blue.svg)](https://pytorch.org/)
 
 > **⚠️ Academic Research Project**: This project exists solely for academic purposes to explore and learn PyTorch internals. For production use, please use the official, well-maintained [**torch/tensordict**](https://github.com/pytorch/tensordict) library.
 
 
@@ -26,13 +26,14 @@ All classes in [`tensorcontainer.tensor_distribution`](/src/tensorcontainer/tens
 
 Many `torch.distributions` constructors accept parameters of type `Union[Number, Tensor]` or any specialization of `Number` (e.g. `float`). However, [`TensorContainer`](/src/tensorcontainer/tensor_container.py) and [`TensorDistribution`](/src/tensorcontainer/tensor_distribution/base.py) can only process `Union[Tensor, TensorContainer]` objects and require all parameters to have compatible shapes for broadcasting.
 
-**Implementation Rule**: When the constructor signature contains `Union[Number, Tensor]` or any specialization of `Number` parameters, implementations **must** use `torch.distributions.utils.broadcast_all` to:
+**Implementation Rule**: When the constructor signature contains `Union[Number, Tensor]` or any specialization of `Number` parameters, implementations **must** use `tensorcontainer.tensor_distribution.utils.broadcast_all` to:
 1. Convert scalar numbers to tensors
 2. Broadcast all parameters to a common shape
 
+
 This preprocessing ensures proper shape and device management within the [`TensorAnnotated`](/src/tensorcontainer/tensor_annotated.py) framework.
 
-**Decision Criterion**: If the constructor signature does not contain `Union[Number, Tensor]` parameters, simpler parameter handling approaches should be preferred.
+**Decision Criterion**: If the constructor signature does not contain `Union[Number, Tensor]` parameters, simpler parameter handling approaches should be preferred. E.g. if it only contains a single argument of type `Tensor`, broadcasting is not necessary and should be avoided.
 
 ### Validation Strategy
 
@@ -46,7 +47,7 @@ This preprocessing ensures proper shape and device management within the [`Tenso
 
 Following the `torch.distributions.Distribution` pattern, basic distribution properties are provided through the [`TensorDistribution`](/src/tensorcontainer/tensor_distribution/base.py) base class via delegation to `self.dist()`.
 
-**Specialization Rule**: Distribution-specific properties **must** be implemented only in the corresponding subclass, maintaining the same delegation pattern to the underlying `torch.distributions` object.
+**Specialization Rule**: Distribution-specific properties (such as `logits` and `probs` in `Categorical`) **must** be implemented only in the corresponding subclass, maintaining the same delegation pattern to the underlying `torch.distributions` object.
 
 ## Implementation Patterns
 
 
@@ -0,0 +1,3 @@
+from .symlog import SymLogDistribution, SymexpTransform, symexp, symlog
+
+__all__ = ["SymLogDistribution", "SymexpTransform", "symexp", "symlog"]
@@ -0,0 +1,132 @@
+from __future__ import annotations
+
+import torch
+from torch.distributions import (
+    Normal,
+    Transform,
+    TransformedDistribution,
+    constraints,
+)
+from typing import Any
+
+
+def symlog(x: torch.Tensor) -> torch.Tensor:
+    """
+    Applies the symlog function element-wise.
+
+    symlog(x) = sign(x) * log(1 + |x|)
+
+    The logarithm is evaluated with ``torch.log1p`` so that inputs close to
+    zero keep their precision instead of being rounded away in ``1 + |x|``.
+
+    Args:
+        x (torch.Tensor): Input tensor.
+
+    Returns:
+        torch.Tensor: Tensor with the same shape as ``x``.
+    """
+    return torch.sign(x) * torch.log1p(torch.abs(x))
+
+
+def symexp(x: torch.Tensor) -> torch.Tensor:
+    """
+    Applies the symexp function element-wise.
+
+    symexp(x) = sign(x) * (exp(|x|) - 1)
+
+    The exponential is evaluated with ``torch.expm1`` so that inputs close
+    to zero do not suffer from cancellation in ``exp(|x|) - 1``.
+
+    Args:
+        x (torch.Tensor): Input tensor.
+
+    Returns:
+        torch.Tensor: Tensor with the same shape as ``x``.
+    """
+    return torch.sign(x) * torch.expm1(torch.abs(x))
+
+
+class SymexpTransform(Transform):
+    """
+    A bijective transform implementing the symexp function.
+
+    The forward pass applies ``symexp`` and the inverse applies ``symlog``.
+    Wrapping a base distribution in this transform yields a distribution
+    whose samples follow the base distribution after being mapped through
+    ``symlog``.
+
+    The transform attributes are declared at class level, like the built-in
+    ``torch.distributions`` transforms, so the inherited
+    ``Transform.__init__(cache_size=0)`` and ``with_cache`` keep working.
+    """
+
+    bijective = True
+    domain = constraints.real
+    codomain = constraints.real
+
+    def _call(self, x: torch.Tensor) -> torch.Tensor:
+        """Map ``x`` from the base space to the output space via symexp."""
+        return symexp(x)
+
+    def _inverse(self, y: torch.Tensor) -> torch.Tensor:
+        """Map ``y`` back to the base space via symlog."""
+        return symlog(y)
+
+    def log_abs_det_jacobian(self, x: torch.Tensor, y: torch.Tensor) -> torch.Tensor:
+        """Return ``log|dy/dx|`` of the forward map, evaluated element-wise."""
+        # For y = symexp(x), dy/dx = exp(|x|)
+        # log|dy/dx| = log(exp(|x|)) = |x|
+        return torch.abs(x)
+
+    @property
+    def sign(self) -> int:
+        """The sign of the transform (always positive for symexp)."""
+        return 1
+
+
+class SymLogDistribution(TransformedDistribution):
+    """
+    A distribution that transforms a Normal distribution with a symexp transform.
+
+    A sample ``y`` is obtained by drawing from ``Normal(loc, scale)`` and
+    applying ``symexp``; equivalently ``symlog(y)`` is normally distributed.
+
+    This distribution is useful for modeling data with a wide dynamic range,
+    where the data can be both positive and negative, and can have values
+    close to zero. The symlog transform compresses large magnitudes while
+    staying approximately linear near zero.
+
+    Args:
+        loc (torch.Tensor): The mean of the base Normal distribution.
+        scale (torch.Tensor): The standard deviation of the base Normal distribution.
+        validate_args (bool, optional): Whether to validate the arguments.
+            Defaults to None.
+    """
+
+    arg_constraints = {"loc": constraints.real, "scale": constraints.positive}
+
+    def __init__(
+        self,
+        loc: torch.Tensor,
+        scale: torch.Tensor,
+        validate_args: bool | None = None,
+    ) -> None:
+        # The parameters are stored exactly as passed in (not broadcast); the
+        # ``loc``/``scale`` properties and ``expand`` read these attributes.
+        self._loc = loc
+        self._scale = scale
+        base_dist = Normal(loc, scale)
+        super().__init__(base_dist, SymexpTransform(), validate_args=validate_args)
+
+    @property
+    def loc(self) -> torch.Tensor:
+        """The ``loc`` parameter of the base Normal distribution."""
+        return self._loc
+
+    @property
+    def scale(self) -> torch.Tensor:
+        """The ``scale`` parameter of the base Normal distribution."""
+        return self._scale
+
+    @property
+    def mean(self) -> torch.Tensor:
+        """Approximation of the mean: returns ``mode``, not the true expectation."""
+        return self.mode
+
+    @property
+    def mode(self) -> torch.Tensor:
+        """
+        ``symexp`` applied to the base Normal's ``loc``.
+
+        NOTE(review): symexp is monotonically increasing, so this value is the
+        median of the distribution; the peak of the transformed density may
+        differ. Confirm that this is the intended definition of "mode".
+        """
+        return symexp(self._loc)
+
+    def expand(
+        self, batch_shape: Any, _instance: SymLogDistribution | None = None
+    ) -> SymLogDistribution:
+        """
+        Returns a new distribution instance with expanded batch shape.
+
+        Args:
+            batch_shape (Any): The new batch shape.
+            _instance (SymLogDistribution, optional): The instance to expand.
+                Defaults to None.
+
+        Returns:
+            SymLogDistribution: The expanded distribution.
+        """
+        new = self._get_checked_instance(SymLogDistribution, _instance)
+        batch_shape = torch.Size(batch_shape)
+        new._loc = self._loc.expand(batch_shape)
+        new._scale = self._scale.expand(batch_shape)
+        base_dist = Normal(new._loc, new._scale)
+        # Re-run the parent initialiser with validation switched off, then
+        # copy this instance's validation flag onto the new instance.
+        super(SymLogDistribution, new).__init__(
+            base_dist, SymexpTransform(), validate_args=False
+        )
+        new._validate_args = self._validate_args
+        return new
@@ -14,7 +14,7 @@ def __init__(
         high: Tensor,
         eps: float = 1e-6,
         validate_args=None,
-    ):
+    ) -> None:
         super().__init__(loc, scale, validate_args)
         self.low = low
         self.high = high
 
@@ -2,12 +2,12 @@
 
 from typing import Any, Iterable, TypeVar, Union, get_args
 
-import torch
 from torch import Tensor
 from torch.utils import _pytree as pytree
 from typing_extensions import Self
 
 from tensorcontainer.tensor_container import TensorContainer
+from tensorcontainer.types import DeviceLike, ShapeLike
 from tensorcontainer.utils import PytreeRegistered
 
 TDCompatible = Union[Tensor, TensorContainer]
@@ -18,12 +18,8 @@
 
 
 class TensorAnnotated(TensorContainer, PytreeRegistered):
-    def __init__(
-        self,
-        shape: torch.Size | list[int] | tuple[int, ...],
-        device: str | torch.device | int | None,
-    ):
-        super().__init__(shape, device, True)
+    def __init__(self, shape: ShapeLike, device: DeviceLike | None):
+        super().__init__(shape, device)
 
     @classmethod
     def _get_annotations(cls, base_cls):
 
@@ -5,26 +5,16 @@
 import threading
 from abc import abstractmethod
 from contextlib import contextmanager
-from typing import (
-    Any,
-    Callable,
-    Iterable,
-    List,
-    Optional,
-    Tuple,
-    Type,
-    Union,
-)
+from typing import Any, Callable, Iterable, List, Optional, Tuple, Type, Union
 
 import torch
 
-# Use the official PyTree utility from torch
 import torch.utils._pytree as pytree
 from torch import Tensor
-from torch._prims_common import DeviceLikeType, ShapeType
 from torch.utils._pytree import Context, KeyEntry, PyTree
 from typing_extensions import Self, TypeAlias
 
+from tensorcontainer.types import DeviceLike, ShapeLike
 from tensorcontainer.utils import resolve_device
 
 HANDLED_FUNCTIONS = {}
@@ -229,25 +219,23 @@ class MyContainer(TensorContainer, PytreeRegistered):
         >>> first_batch = container[0]           # Shape becomes (3,), events preserved
     """
 
-    shape: ShapeType
+    shape: torch.Size
     device: Optional[torch.device]
 
     # Thread-local storage for unsafe construction flag
     _validation_disabled = threading.local()
 
     def __init__(
         self,
-        shape: ShapeType,
-        device: Optional[DeviceLikeType],
-        validate_args: bool = True,
+        shape: ShapeLike,
+        device: DeviceLike | None,
     ):
         super().__init__()
 
-        self.shape = shape
-        self.device = None if device is None else torch.device(resolve_device(device))
+        self.shape = torch.Size(shape)
+        self.device = None if device is None else resolve_device(device)
 
-        if validate_args:
-            self._validate()
+        self._validate()
 
     @classmethod
     @contextmanager
@@ -378,7 +366,7 @@ def get_number_of_consuming_dims(self, item) -> int:
 
         return 1
 
-    def transform_ellipsis_index(self, shape: tuple[int, ...], idx: tuple) -> tuple:
+    def transform_ellipsis_index(self, shape: torch.Size, idx: tuple) -> tuple:
         """
         Transforms an indexing tuple with an ellipsis into an equivalent one without it.
         ...
@@ -465,7 +453,7 @@ def _format_item(key, value):
         # Assemble the final, properly formatted representation string
         return (
             f"{self.__class__.__name__}(\n"
-            f"{indent}shape={str(self.shape)},\n"
+            f"{indent}shape={tuple(self.shape)},\n"
             f"{indent}device={self.device},\n"
             f"{indent}items=\n{textwrap.indent(indented_items, indent)}\n{indent}\n"
             f")"
@@ -549,7 +537,7 @@ def __setitem__(self: Self, index: Any, value: Self) -> None:
                     v[processed_index] = k.get(value)
                 except Exception as e:
                     raise type(e)(
-                        f"Issue with key {str(k)} and index {processed_index} for value of shape {v.shape} and type {type(v)} and assignment of shape {value.shape}"
+                        f"Issue with key {str(k)} and index {processed_index} for value of shape {v.shape} and type {type(v)} and assignment of shape {tuple(value.shape)}"
                     ) from e
 
     def view(self: Self, *shape: int) -> Self:
@@ -753,7 +741,7 @@ def unsqueeze(self: Self, dim: int) -> Self:
 
     def size(self) -> torch.Size:
         """Returns the size of the batch dimensions."""
-        return torch.Size(self.shape)
+        return self.shape
 
     def dim(self) -> int:
         """Returns the number of batch dimensions."""
 
@@ -7,10 +7,11 @@
 
 import torch
 from torch import Tensor
+from tensorcontainer.types import DeviceLike, ShapeLike
 from typing_extensions import dataclass_transform
 
 from tensorcontainer.tensor_annotated import TensorAnnotated
-from tensorcontainer.tensor_container import ShapeType, TensorContainer
+from tensorcontainer.tensor_container import TensorContainer
 
 TDCompatible = Union[Tensor, TensorContainer]
 DATACLASS_ARGS = {"init", "repr", "eq", "order", "unsafe_hash", "frozen", "slots"}
@@ -184,8 +185,8 @@ class FinalData(ExtendedData):
     # can enable static analyzers to provide type hints in IDEs. Both are programmatically
     # added in __init_subclass__ so removing the following two lines will only remove the
     # type hints, but the class will stay functional.
-    shape: ShapeType
-    device: Optional[torch.device]
+    shape: ShapeLike
+    device: Optional[DeviceLike]  # None is allowed, matching TensorAnnotated.__init__ (`DeviceLike | None`)
 
     def __init_subclass__(cls, **kwargs):
         """Automatically convert subclasses into dataclasses with proper field inheritance.
@@ -215,7 +216,7 @@ def __init_subclass__(cls, **kwargs):
         annotations = cls._get_annotations(TensorDataClass)
 
         cls.__annotations__ = {
-            "shape": torch.Size,
+            "shape": ShapeLike,
             "device": Optional[torch.device],
             **annotations,
         }
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+from .symlog import SymLogDistribution, SymexpTransform, symexp, symlog`
	`2`	`+`
	`3`	`+__all__ = ["SymLogDistribution", "SymexpTransform", "symexp", "symlog"]`