"""Core — Tensor and autograd primitives.
Core Tensor, Parameter, Config and autograd Function primitives used across
the syna library. This module contains the lightweight Tensor container and
the Function base class which implement forward/backward for automatic
differentiation.
"""
from __future__ import annotations
import contextlib
import weakref
from typing import Any, Optional
import numpy as np
import syna
class Config:
"""Global config flags affecting backprop and training behavior."""
enable_backprop = True
train = True
@contextlib.contextmanager
def using_config(name: str, value: bool):
"""Temporarily set a Config attribute inside a context."""
old_value = getattr(Config, name)
setattr(Config, name, value)
try:
yield
finally:
setattr(Config, name, old_value)
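# Usage sketch for `using_config` (illustrative, using only names defined in
# this module):
#
#     with using_config("enable_backprop", False):
#         pass  # functions called here do not record a computational graph
#     # The previous value of Config.enable_backprop is restored on exit,
#     # even if an exception is raised inside the block.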
def test_mode():
"""Context manager to set train flag to False."""
return using_config("train", False)
def no_grad():
"""Context manager to disable gradient tracking."""
return using_config("enable_backprop", False)
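# Usage sketch: `no_grad` and `test_mode` are thin wrappers over `using_config`.
#
#     with no_grad():
#         pass  # inference-only code; no graph is recorded
#     with test_mode():
#         pass  # layers that consult Config.train (e.g. dropout) switch to eval behavior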
class Tensor:
"""Simple Tensor container holding data, gradient and creator Function.
Most operator behavior delegates to syna.functions.* helpers so this class
focuses on bookkeeping for autograd.
"""
__array_priority__ = 200
def __init__(self, data, name: Optional[str] = None) -> None:
# normalize scalars/lists to numpy arrays
if not isinstance(data, np.ndarray) and data is not None:
data = as_array(data)
self.data = data
self.name = name
self.grad: Optional[Tensor] = None
self.creator: Optional[Function] = None
self.generation: int = 0
@property
def shape(self):
return self.data.shape
@property
def ndim(self):
return self.data.ndim
@property
def size(self):
return self.data.size
@property
def dtype(self):
return self.data.dtype
def __len__(self):
return len(self.data)
def __repr__(self):
if self.data is None:
return "tensor(None)"
p = str(self.data).replace("\n", "\n" + " " * 7)
return "tensor(" + p + ")"
# arithmetic delegations
def __add__(self, other):
return syna.functions.add(self, other)
def __radd__(self, other):
return syna.functions.add(self, other)
def __mul__(self, other):
return syna.functions.mul(self, other)
def __rmul__(self, other):
return syna.functions.mul(self, other)
def __neg__(self):
return syna.functions.neg(self)
def __sub__(self, other):
return syna.functions.sub(self, other)
def __rsub__(self, other):
return syna.functions.sub(other, self)
def __truediv__(self, other):
return syna.functions.div(self, other)
def __rtruediv__(self, other):
return syna.functions.div(other, self)
def __pow__(self, other):
return syna.functions.pow(self, other)
def __getitem__(self, other):
return syna.functions.get_item(self, other)
def max(self, **kwargs):
return syna.functions.max(self, **kwargs)
def min(self, **kwargs):
return syna.functions.min(self, **kwargs)
def set_creator(self, func: Function) -> None:
"""Mark this tensor as created by func (used for backprop ordering)."""
self.creator = func
self.generation = func.generation + 1
def unchain(self) -> None:
"""Remove reference to creator to break the computational graph."""
self.creator = None
def cleargrad(self) -> None:
"""Clear stored gradient."""
self.grad = None
def backward(self, retain_grad=False, create_graph=False) -> None:
"""Run backpropagation to compute gradients of inputs.
Args:
retain_grad: if False, intermediate gradients are cleared to save memory.
create_graph: if True, create graph for higher-order gradients.
"""
if self.grad is None:
self.grad = Tensor(np.ones_like(self.data))
        funcs: list[Function] = []
        seen_set = set()

        def add_func(f: Function) -> None:
            if f not in seen_set:
                funcs.append(f)
                seen_set.add(f)
                funcs.sort(key=lambda x: x.generation)

        if self.creator is None:
            return  # nothing to backprop
        add_func(self.creator)
        while funcs:
            f = funcs.pop()
            gys = [output().grad for output in f.outputs]
            # backward must run inside this context so that create_graph=True
            # actually records a graph for higher-order gradients
            with using_config("enable_backprop", create_graph):
                gxs = f.backward(*gys)
                if not isinstance(gxs, tuple):
                    gxs = (gxs,)
                for x, gx in zip(f.inputs, gxs):
                    if x.grad is None:
                        x.grad = gx
                    else:
                        x.grad = x.grad + gx
                    if x.creator is not None:
                        add_func(x.creator)
            if not retain_grad:
                for y in f.outputs:
                    y().grad = None
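    # Usage sketch for `backward` (illustrative; assumes the arithmetic ops
    # delegated to syna.functions behave as usual):
    #
    #     x = tensor(3.0)
    #     y = x * x
    #     y.backward()
    #     # x.grad now holds dy/dx = 2 * x = 6.0
    #
    #     # With create_graph=True the backward pass itself is recorded, so
    #     # x.grad can be backpropagated again for higher-order derivatives.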
def unchain_backward(self):
"""Remove creators for all upstream tensors (useful for freeing graph)."""
if self.creator is not None:
funcs = [self.creator]
while funcs:
f = funcs.pop()
for x in f.inputs:
if x.creator is not None:
funcs.append(x.creator)
x.unchain()
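    # Sketch: `unchain_backward` is typically used for truncated backpropagation
    # through time, cutting the graph after each update so that earlier time
    # steps can be garbage-collected. (The names below are hypothetical
    # placeholders, not part of this module.)
    #
    #     loss.backward()
    #     loss.unchain_backward()  # drop creator links upstream of `loss`
    #     # ... apply the parameter update here ...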
def reshape(self, *shape: int):
if len(shape) == 1 and isinstance(shape[0], (tuple, list)):
shape = shape[0]
return syna.functions.reshape(self, shape)
def transpose(self, *axes: int):
if len(axes) == 0:
axes = None
elif len(axes) == 1:
if isinstance(axes[0], (tuple, list)) or axes[0] is None:
axes = axes[0]
return syna.functions.transpose(self, axes)
def sum(self, axis=None, keepdims=False):
return syna.functions.sum(self, axis, keepdims)
@property
def T(self):
return syna.functions.transpose(self)
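    # Shape-manipulation sketch (illustrative; these methods delegate to
    # syna.functions):
    #
    #     x = rand(2, 3)
    #     x.reshape(3, 2)      # also accepts a tuple: x.reshape((3, 2))
    #     x.transpose(1, 0)    # same as x.T for 2-D tensors
    #     x.sum(axis=0)        # reduce over the first axis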
class Parameter(Tensor):
"""A thin wrapper for trainable parameters (keeps API separate)."""
pass
def tensor(
data, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Tensor factory.
Args:
data: array-like or scalar.
dtype: numpy dtype (optional).
requires_grad: if True, the returned Tensor is a leaf that will accumulate gradients.
name: optional name for the Tensor.
"""
arr = np.array(data, dtype=dtype) if dtype is not None else np.array(data)
if requires_grad:
return Tensor(arr, name=name)
else:
with no_grad():
return Tensor(arr, name=name)
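# Usage sketch for the `tensor` factory (illustrative):
#
#     a = tensor([1.0, 2.0, 3.0], dtype=np.float32, requires_grad=True)
#     b = tensor(5)        # scalar -> 0-d numpy array wrapped in a Tensor
#     c = tensor(a.data)   # note: np.array(...) copies the input buffer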
def as_tensor(obj) -> Tensor:
"""Ensure obj is a Tensor; convert scalars/arrays to Tensor if needed.
Delegates to tensor(...), which follows PyTorch-style semantics.
"""
if isinstance(obj, Tensor):
return obj
return tensor(obj)
def as_array(x) -> np.ndarray:
    """Convert scalars and array-likes to numpy arrays; leave ndarrays unchanged."""
    if isinstance(x, np.ndarray):
        return x
    return np.asarray(x)
# Random and utility tensor factories (torch-like)
def _normalize_shape_args(shape_args):
if len(shape_args) == 1 and isinstance(shape_args[0], (tuple, list)):
return tuple(shape_args[0])
return tuple(shape_args)
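# The helper above lets the factories below accept either separate ints or a
# single tuple/list, torch-style. Illustrative sketch:
#
#     rand(2, 3).shape     # (2, 3)
#     rand((2, 3)).shape   # (2, 3) as well
#     zeros([4]).shape     # (4,)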
def rand(
*shape, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor with uniform random values in [0, 1)."""
shape = _normalize_shape_args(shape)
arr = np.random.rand(*shape)
if dtype is not None:
arr = arr.astype(dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def randn(
*shape, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor with samples from the standard normal distribution."""
shape = _normalize_shape_args(shape)
arr = np.random.randn(*shape)
if dtype is not None:
arr = arr.astype(dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def zeros(
*shape, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor filled with zeros."""
shape = _normalize_shape_args(shape)
arr = np.zeros(shape, dtype=dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def ones(
*shape, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor filled with ones."""
shape = _normalize_shape_args(shape)
arr = np.ones(shape, dtype=dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def full(
shape,
fill_value,
dtype=None,
requires_grad: bool = False,
name: Optional[str] = None,
) -> Tensor:
"""Return a tensor of shape `shape` filled with `fill_value`.
`shape` may be an int or a tuple/list of ints (matches numpy/torch style).
"""
# normalize shape to tuple
if isinstance(shape, (tuple, list)):
shape = tuple(shape)
else:
try:
# allow ints-like
shape = (int(shape),)
except Exception:
# fallback: try to treat as array-like and use its shape
shape = tuple(np.array(shape).shape)
arr = np.full(shape, fill_value, dtype=dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
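# Usage sketch for `full` (illustrative):
#
#     full(3, 7.0).shape                  # (3,); an int shape is promoted to a tuple
#     full((2, 2), 7.0, dtype=np.int64)   # 2x2 tensor of integer sevens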
def arange(
start,
stop=None,
step=1,
dtype=None,
requires_grad: bool = False,
name: Optional[str] = None,
) -> Tensor:
"""Return a 1-D tensor with values from start to stop (exclusive)."""
if stop is None:
arr = np.arange(start, dtype=dtype, step=step)
else:
arr = np.arange(start, stop, step=step, dtype=dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def randint(
low,
high=None,
size=None,
dtype=None,
requires_grad: bool = False,
name: Optional[str] = None,
) -> Tensor:
"""Return random integers from low (inclusive) to high (exclusive)."""
arr = np.random.randint(low, high=high, size=size)
if dtype is not None:
arr = arr.astype(dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def eye(
n, m=None, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a 2-D identity matrix (or rectangular identity if m is given)."""
arr = np.eye(N=n, M=m, dtype=dtype) if m is not None else np.eye(N=n, dtype=dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def zeros_like(
x, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor of zeros with the same shape as x (Tensor or array-like)."""
if isinstance(x, Tensor):
shape = x.shape
use_dtype = dtype if dtype is not None else x.dtype
else:
arr_like = np.array(x)
shape = arr_like.shape
use_dtype = dtype if dtype is not None else arr_like.dtype
arr = np.zeros(shape, dtype=use_dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def ones_like(
x, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor of ones with the same shape as x (Tensor or array-like)."""
if isinstance(x, Tensor):
shape = x.shape
use_dtype = dtype if dtype is not None else x.dtype
else:
arr_like = np.array(x)
shape = arr_like.shape
use_dtype = dtype if dtype is not None else arr_like.dtype
arr = np.ones(shape, dtype=use_dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def full_like(
x, fill_value, dtype=None, requires_grad: bool = False, name: Optional[str] = None
) -> Tensor:
"""Return a tensor with the same shape as `x` filled with `fill_value`.
`x` may be a `Tensor` or array-like.
"""
if isinstance(x, Tensor):
shape = x.shape
use_dtype = dtype if dtype is not None else x.dtype
else:
arr_like = np.array(x)
shape = arr_like.shape
use_dtype = dtype if dtype is not None else arr_like.dtype
arr = np.full(shape, fill_value, dtype=use_dtype)
return tensor(arr, requires_grad=requires_grad, name=name)
def range(
start,
stop=None,
step=1,
dtype=None,
requires_grad: bool = False,
name: Optional[str] = None,
) -> Tensor:
"""Alias for arange to match torch.range-like convenience (behaves like arange)."""
return arange(
start, stop=stop, step=step, dtype=dtype, requires_grad=requires_grad, name=name
)
class Function:
"""Base Function for forward/backward ops used in autograd.
Subclasses should implement forward (numpy arrays -> numpy arrays) and
backward (Tensor grads -> Tensor grads).
"""
def __call__(self, *input: Tensor | np.ndarray | int | float) -> Any:
inputs = [as_tensor(x) for x in input]
xs = [x.data for x in inputs]
ys = self.forward(*xs)
if not isinstance(ys, tuple):
ys = (ys,)
outputs = [as_tensor(y) for y in ys]
if Config.enable_backprop:
self.generation = max(x.generation for x in inputs) if inputs else 0
for output in outputs:
output.set_creator(self)
self.inputs = inputs
self.outputs = [weakref.ref(output) for output in outputs]
return outputs[0] if len(outputs) == 1 else outputs
def forward(self, *args: np.ndarray) -> np.ndarray:
raise NotImplementedError()
    def backward(self, *args: Tensor) -> Tensor | tuple[Tensor, ...]:
raise NotImplementedError()
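# Sketch of a Function subclass (illustrative only; the real implementations in
# syna.functions may differ). `forward` works on raw numpy arrays, while
# `backward` receives and returns Tensors so higher-order gradients remain
# possible when create_graph=True.
#
#     class Square(Function):
#         def forward(self, x: np.ndarray) -> np.ndarray:
#             return x ** 2
#
#         def backward(self, gy: "Tensor") -> "Tensor":
#             (x,) = self.inputs
#             return 2.0 * x * gy
#
#     x = tensor(3.0)
#     y = Square()(x)
#     y.backward()  # x.grad is now 6.0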