Source code for boundlab.expr._core

r"""Core Expression Classes

This module defines the base expression class and flags used throughout
the expression framework.
"""

from copy import copy
import itertools
import sys
from typing import Callable, Literal, Optional, Union

import torch
import enum

from boundlab import utils
from boundlab.linearop import ScalarOp
from boundlab.linearop._base import LinearOp
from boundlab.prop import ub



[docs]
class ExprFlags(enum.Flag):
    """Bit flags describing properties of an expression.

    Members can be combined with ``|`` and tested with ``in`` or ``&``.
    """
    NONE = 0
    SYMMETRIC_TO_0 = 1 << 0
    """The feasible region is symmetric about zero."""
    PRINT_FUSE = 1 << 1
    """Expression should be fused with parent when printing."""
    IS_CONST = 1 << 2
    """Expression represents a constant value."""
    IS_AFFINE = 1 << 3
    """Expression represents an affine transformation of its inputs."""


# Module-level counter; ``Expr.__init__`` draws each new expression's ``id``
# from it, so ids increase in construction order.
_EXPR_ID_COUNTER = itertools.count()


[docs]
class Expr:
    """Abstract base class for all symbolic expressions in BoundLab.

    Each expression represents a node in a directed acyclic graph (DAG) of
    computations. Expressions are immutable after construction, and each
    instance is assigned an integer id drawn from a module-level counter at
    construction time, so ids increase in creation order and can be used for
    deterministic topological ordering during bound propagation.

    Subclasses must implement :attr:`shape`, :attr:`children`, and
    :meth:`backward` to define the expression's semantics.
    """

    id: int
    """Unique identifier for the expression, used for topological sorting."""
    flags: ExprFlags
    """Flags indicating expression properties for optimization."""


[docs]
    def __init__(self, flags: ExprFlags = ExprFlags.NONE):
        """Record ``flags`` and take the next id from the module-level counter."""
        self.flags = flags
        self.id = next(_EXPR_ID_COUNTER)

    

[docs]
    def with_children(self, *new_children: "Expr") -> "Expr":
        """Return a new expression with the same type and flags but new children."""
        raise NotImplementedError(f"The :code:`with_children` method is not implemented for {self.__class__.__name__}.")


    @property
    def shape(self) -> torch.Size:
        """The shape of the output(s) produced by this expression."""
        raise NotImplementedError(f"The :code:`shape` property is not implemented for {self.__class__.__name__}.")

    @property
    def children(self) -> tuple["Expr", ...]:
        """The child expressions that serve as inputs to this expression."""
        raise NotImplementedError(f"The :code:`children` property is not implemented for {self.__class__.__name__}.")


[docs]
    def backward(self, weights: LinearOp, direction: Literal[">=", "<=", "=="] = "==") \
            -> tuple[torch.Tensor, list[LinearOp]] | None:
        r"""Perform backward-mode bound propagation through this expression.

        Given an accumulated weight ``weights`` (usually a 
        :class:`~boundlab.linearop.EinsumOp`) from the output back to this
        node, backward propagation derives child weights and a bias:

        .. math::

            \mathbf{w}^\top f(x_1, \ldots, x_n)
            \;\square\; b + \sum_i \mathbf{w}_i^\top x_i

        Args:
            weights: A :class:`~boundlab.linearop.EinsumOp` accumulated
                weight from the root expression to this node.
            direction: Bound direction — ``">="`` (lower), ``"<="`` (upper),
                or ``"=="`` (exact).

        Returns:
            A tuple ``(bias, child_weights)`` where ``bias`` is a
            :class:`torch.Tensor` or ``0``, and ``child_weights`` is a list
            of :class:`~boundlab.linearop.EinsumOp` (one per child).
            Returns ``None`` if this expression cannot contribute to the bound
            in the given direction.
        """
        raise NotImplementedError(f"The :code:`backward` method is not implemented for {self.__class__.__name__}.")



[docs]
    def to_string(self, *children_str: str) -> str:
        """Return string representation with child strings substituted."""
        return f"{self.__class__.__name__}({', '.join(children_str)})"


    def _metric(self) -> float:
        width = self.bound_width()
        index = width.argmax()
        indices = torch.unravel_index(index, width.shape)
        return width.max(), self.center()[indices].item()

    def __repr__(self):
        output = []
        w, w_c = self._metric()

        output.append(f"max={w:.4g}/{w_c:.4g}")
        output.append(f"mean={self.bound_width().mean().item():.4g}/{self.center().mean().item():.4g}")
        li = list(self.uncertainty_reasons().items())
        li.sort(key=lambda x: x[1], reverse=True)
        for k, v in li[:3]:
            output.append(f"{k}={v:.4e}")
        return f"Expr({','.join(output)})"
    
    def __str__(self):
        """Render the expression DAG via :func:`expr_pretty_print`, wrapped in ``bl.Expr { … }``."""
        listing = expr_pretty_print(self, indent=4)
        return f"bl.Expr {{\n{listing}\n}}"

    # ------------------------------------------------------------------
    # Arithmetic operators — all produce AffineSum with ScalarOp/EinsumOp ops
    # ------------------------------------------------------------------


[docs]
    def __add__(self, other):
        """Return ``self + other`` as an ``AffineSum``.

        Accepts another expression of identical shape, a tensor (expanded to
        ``self.shape`` when the shapes differ and wrapped in ``ConstVal``),
        a ``ConstVal``, or the integer ``0`` (which returns ``self``
        unchanged). Anything else yields ``NotImplemented``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        rhs = other.value if isinstance(other, ConstVal) else other
        if isinstance(rhs, int) and rhs == 0:
            return self
        if isinstance(rhs, torch.Tensor):
            if rhs.shape != self.shape:
                rhs = rhs.expand(self.shape)
            rhs = ConstVal(rhs)
        if not isinstance(rhs, Expr):
            return NotImplemented
        assert self.shape == rhs.shape, f"Shape mismatch for addition: {self.shape} vs {rhs.shape}"
        left_term = (ScalarOp(1.0, self.shape), self)
        right_term = (ScalarOp(1.0, rhs.shape), rhs)
        return AffineSum(left_term, right_term)


    def __radd__(self, other):
        """Return ``other + self`` as an ``AffineSum`` with ``other`` first.

        Accepts the same operand kinds as :meth:`__add__`; the integer ``0``
        returns ``self`` unchanged, and unsupported operands yield
        ``NotImplemented``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        lhs = other.value if isinstance(other, ConstVal) else other
        if isinstance(lhs, int) and lhs == 0:
            return self
        if isinstance(lhs, torch.Tensor):
            if lhs.shape != self.shape:
                lhs = lhs.expand(self.shape)
            lhs = ConstVal(lhs)
        if not isinstance(lhs, Expr):
            return NotImplemented
        left_term = (ScalarOp(1.0, lhs.shape), lhs)
        right_term = (ScalarOp(1.0, self.shape), self)
        return AffineSum(left_term, right_term)

    def __neg__(self):
        """Return ``-self`` as an ``AffineSum`` with a single ``ScalarOp(-1.0)`` term."""
        # Only AffineSum is needed here; ScalarOp comes from the module-level import.
        from boundlab.expr._affine import AffineSum
        return AffineSum((ScalarOp(-1.0, self.shape), self))

    def __sub__(self, other):
        """Return ``self - other``, computed as ``self + (-other)``.

        Accepts an expression, a tensor, a ``ConstVal`` (unwrapped to its
        value) or the integer ``0``. The ``0`` case returns ``self``
        unchanged, mirroring :meth:`__add__`. Any other operand yields
        ``NotImplemented``.
        """
        from boundlab.expr._affine import ConstVal
        if isinstance(other, ConstVal):
            other = other.value
        # Keep subtraction consistent with addition, which treats int 0 as identity.
        if isinstance(other, int) and other == 0:
            return self
        if isinstance(other, (Expr, torch.Tensor)):
            return self + (-other)
        return NotImplemented

    def __rsub__(self, other):
        """Return ``other - self``, computed as ``other + (-self)``.

        Accepts an expression, a tensor, a ``ConstVal`` (unwrapped to its
        value) or the integer ``0``. The ``0`` case returns ``-self``,
        mirroring how :meth:`__radd__` accepts ``0``. Any other operand
        yields ``NotImplemented``.
        """
        from boundlab.expr._affine import ConstVal
        if isinstance(other, ConstVal):
            other = other.value
        # Keep subtraction consistent with addition, which treats int 0 as identity.
        if isinstance(other, int) and other == 0:
            return -self
        if isinstance(other, (Expr, torch.Tensor)):
            return other + (-self)
        return NotImplemented


[docs]
    def __mul__(self, other):
        """Element-wise multiplication (no broadcast).

        A Python number or 0-dim tensor becomes a ``ScalarOp``; any other
        tensor becomes ``EinsumOp.from_hardmard(tensor, rank)``. A
        ``ConstVal`` is unwrapped first. Other operands yield
        ``NotImplemented``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        factor = other.value if isinstance(other, ConstVal) else other

        from boundlab.linearop import EinsumOp, ScalarOp
        if isinstance(factor, (int, float)):
            scale = float(factor)
        elif isinstance(factor, torch.Tensor):
            if factor.dim() != 0:
                return AffineSum((EinsumOp.from_hardmard(factor, len(self.shape)), self))
            scale = float(factor.item())
        else:
            return NotImplemented
        return AffineSum((ScalarOp(scale, self.shape), self))


    def __rmul__(self, other):
        """Element-wise multiplication (no broadcast), reflected operand order.

        Handles the same operand kinds as :meth:`__mul__` and builds the same
        single-term ``AffineSum``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        if isinstance(other, ConstVal):
            other = other.value

        from boundlab.linearop import EinsumOp, ScalarOp

        def scaled_by(value):
            # Uniform scaling of every element by a Python float.
            return AffineSum((ScalarOp(float(value), self.shape), self))

        if isinstance(other, (int, float)):
            return scaled_by(other)
        if not isinstance(other, torch.Tensor):
            return NotImplemented
        if other.dim() == 0:
            return scaled_by(other.item())
        return AffineSum((EinsumOp.from_hardmard(other, len(self.shape)), self))

    def __truediv__(self, other):
        """Divide by a scalar or tensor by multiplying with its reciprocal.

        A 0-dim expression divided by a tensor with dimensions is first
        expanded to the tensor's shape; otherwise a tensor whose shape
        differs from ``self.shape`` is expanded to ``self.shape``. A
        ``ConstVal`` is unwrapped first. Other operands yield
        ``NotImplemented``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        divisor = other.value if isinstance(other, ConstVal) else other

        if isinstance(divisor, (int, float)):
            return self * (1.0 / divisor)
        if not isinstance(divisor, torch.Tensor):
            return NotImplemented

        has_axes = divisor.dim() > 0
        if has_axes and len(self.shape) == 0:
            return self.expand(*list(divisor.shape)) * (1.0 / divisor)
        if has_axes and tuple(self.shape) != tuple(divisor.shape):
            divisor = divisor.expand(*list(self.shape))
        return self * (1.0 / divisor)

    def __matmul__(self, other):
        """Matrix multiply: self @ other. Supports batched matmul.

        ``other`` must be a tensor (or a ``ConstVal``, which is unwrapped)
        with at least two dimensions; anything else yields
        ``NotImplemented``. The product is expressed as a single-term
        ``AffineSum`` over an ``EinsumOp``.

        NOTE(review): the axis comments below assume ``input_dims`` /
        ``output_dims`` list the weight-tensor axes matched to the input /
        output — confirm against ``EinsumOp``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        if isinstance(other, ConstVal):
            other = other.value

        from boundlab.linearop import EinsumOp
        if isinstance(other, torch.Tensor) and len(other.shape) >= 2:
            assert self.shape[-1] == other.shape[-2], \
                f"Inner dims must match: {self.shape} @ {other.shape}"
            if len(self.shape) == 1:
                # Vector @ (batched) matrix: ``other`` is (*batch, K, S2).
                K = self.shape[0]
                batch_t = other.shape[:-2]
                S2 = other.shape[-1]
                nb = len(batch_t)
                # Input uses the K axis (index nb); output keeps batch axes and S2.
                input_dims = [nb]
                output_dims = list(range(nb)) + [nb + 1]
                return AffineSum((EinsumOp(other, input_dims, output_dims), self))
            batch_s = self.shape[:-2]
            batch_t = other.shape[:-2]
            S, D, S2 = self.shape[-2], self.shape[-1], other.shape[-1]
            # Broadcast only when both sides have batch dims; otherwise take
            # whichever side is non-empty.
            batch = torch.broadcast_shapes(batch_s, batch_t) if (batch_s and batch_t) else (batch_s or batch_t)
            nb = len(batch)
            other_b = other.expand(*batch, D, S2)
            # Weight tensor laid out as (*batch, S, D, S2).
            tensor = other_b.unsqueeze(nb).expand(*batch, S, D, S2)
            ns = len(self.shape)
            # Input occupies the trailing ``ns`` axes of (*batch, S, D).
            input_dims = list(range(nb + 2))[-ns:]
            # Output keeps (*batch, S) and S2; the D axis (nb + 1) is omitted.
            output_dims = list(range(nb + 1)) + [nb + 2]
            return AffineSum((EinsumOp(tensor, input_dims, output_dims), self))
        return NotImplemented

    def __rmatmul__(self, other):
        """Matrix multiply: other @ self. Supports batched matmul.

        ``other`` must be a tensor (or a ``ConstVal``, which is unwrapped)
        with at least two dimensions; anything else yields
        ``NotImplemented``. The product is expressed as a single-term
        ``AffineSum`` over an ``EinsumOp``.

        NOTE(review): the axis comments below assume ``input_dims`` /
        ``output_dims`` list the weight-tensor axes matched to the input /
        output — confirm against ``EinsumOp``.
        """
        from boundlab.expr._affine import AffineSum, ConstVal
        if isinstance(other, ConstVal):
            other = other.value
            
        from boundlab.linearop import EinsumOp
        if isinstance(other, torch.Tensor) and len(other.shape) >= 2:
            M, K = other.shape[-2], other.shape[-1]
            batch_t = other.shape[:-2]
            if len(self.shape) == 1:
                # (Batched) matrix @ vector: ``other`` is (*batch, M, K).
                assert self.shape[0] == K, f"Inner dims must match: {other.shape} @ {self.shape}"
                nb = len(batch_t)
                # Input uses the K axis (index nb + 1); output keeps batch axes and M.
                input_dims = [nb + 1]
                output_dims = list(range(nb + 1))
                return AffineSum((EinsumOp(other, input_dims, output_dims), self))
            assert self.shape[-2] == K, f"Inner dims must match: {other.shape} @ {self.shape}"
            N = self.shape[-1]
            batch_s = self.shape[:-2]
            # Broadcast only when both sides have batch dims; otherwise take
            # whichever side is non-empty.
            batch = torch.broadcast_shapes(batch_t, batch_s) if (batch_t and batch_s) else (batch_t or batch_s)
            nb = len(batch)
            other_b = other.expand(*batch, M, K)
            # Weight tensor laid out as (*batch, M, K, N).
            tensor = other_b.unsqueeze(-1).expand(*batch, M, K, N)
            # The conditional applies to the whole sum: with batch dims on self,
            # use its trailing batch axes plus (K, N); otherwise just (K, N).
            input_dims = list(range(nb))[-len(batch_s):] + [nb + 1, nb + 2] if batch_s else [nb + 1, nb + 2]
            # Output keeps (*batch, M) and N; the K axis (nb + 1) is omitted.
            output_dims = list(range(nb + 1)) + [nb + 2]
            return AffineSum((EinsumOp(tensor, input_dims, output_dims), self))
        return NotImplemented
    

    # ------------------------------------------------------------------
    # Shape / indexing operators — produce AffineSum wrapping a generic LinearOp
    # ------------------------------------------------------------------

    def _apply_op(self, op):
        """Return a single-term ``AffineSum`` pairing ``op`` with this expression."""
        from boundlab.expr._affine import AffineSum
        term = (op, self)
        return AffineSum(term)


[docs]
    def reshape(self, *shape) -> "Expr":
        """Apply a ``ReshapeOp`` built from the current shape and ``shape``."""
        from boundlab.linearop import ReshapeOp
        op = ReshapeOp(self.shape, shape)
        return self._apply_op(op)



[docs]
    def permute(self, *dims) -> "Expr":
        """Apply a ``PermuteOp`` built from the current shape and ``dims``."""
        from boundlab.linearop import PermuteOp
        op = PermuteOp(self.shape, dims)
        return self._apply_op(op)



[docs]
    def transpose(self, dim0, dim1) -> "Expr":
        """Apply a ``TransposeOp`` built from the current shape, ``dim0`` and ``dim1``."""
        from boundlab.linearop import TransposeOp
        op = TransposeOp(self.shape, dim0, dim1)
        return self._apply_op(op)

    
    @property
    def T(self) -> "Expr":
        """Convenience for transpose of the last two dimensions."""
        if len(self.shape) < 2:
            raise ValueError(f"Cannot transpose last two dimensions of shape {self.shape} with less than 2 dims.")
        return self.transpose(len(self.shape) - 2, len(self.shape) - 1)


[docs]
    def flatten(self, start_dim=0, end_dim=-1) -> "Expr":
        """Apply a ``FlattenOp`` built from the current shape and the given dim range."""
        from boundlab.linearop import FlattenOp
        op = FlattenOp(self.shape, start_dim, end_dim)
        return self._apply_op(op)



[docs]
    def unflatten(self, dim, sizes) -> "Expr":
        """Apply an ``UnflattenOp`` built from the current shape, ``dim`` and ``sizes``."""
        from boundlab.linearop import UnflattenOp
        op = UnflattenOp(self.shape, dim, sizes)
        return self._apply_op(op)



[docs]
    def squeeze(self, dim=None) -> "Expr":
        """Apply a ``SqueezeOp`` built from the current shape and ``dim``."""
        from boundlab.linearop import SqueezeOp
        op = SqueezeOp(self.shape, dim)
        return self._apply_op(op)



[docs]
    def unsqueeze(self, dim) -> "Expr":
        """Apply an ``UnsqueezeOp`` built from the current shape and ``dim``."""
        from boundlab.linearop import UnsqueezeOp
        op = UnsqueezeOp(self.shape, dim)
        return self._apply_op(op)



[docs]
    def narrow(self, dim, start, length) -> "Expr":
        """Apply a ``NarrowOp`` built from the current shape, ``dim``, ``start`` and ``length``."""
        from boundlab.linearop import NarrowOp
        op = NarrowOp(self.shape, dim, start, length)
        return self._apply_op(op)



[docs]
    def expand(self, *sizes) -> "Expr":
        """Expand to ``sizes``, first adding leading dims if ``sizes`` is longer than the rank.

        One ``unsqueeze(0)`` is applied per missing leading dimension, then
        an ``ExpandOp`` targeting ``torch.Size(sizes)`` is applied.
        """
        from boundlab.linearop import ExpandOp, UnsqueezeOp
        missing = len(sizes) - len(self.shape)
        padded = self
        # range() of a non-positive count is empty, so no padding happens then.
        for _ in range(missing):
            padded = padded.unsqueeze(0)
        source_shape = padded.shape
        target_shape = torch.Size(sizes)
        return padded._apply_op(ExpandOp(source_shape, target_shape))

    

[docs]
    def expand_on(self, dim, size) -> "Expr":
        """Expand the size-1 dimension ``dim`` to ``size`` via an ``ExpandOp``.

        Asserts that the current size along ``dim`` is 1.
        """
        from boundlab.linearop import ExpandOp
        target = list(self.shape)
        assert target[dim] == 1, f"Can only expand on size-1 dim, but dim {dim} has size {target[dim]}"
        target[dim] = size
        op = ExpandOp(self.shape, torch.Size(target))
        return self._apply_op(op)



[docs]
    def repeat(self, *sizes) -> "Expr":
        """Apply a ``RepeatOp`` built from the current shape and ``sizes``."""
        from boundlab.linearop import RepeatOp
        op = RepeatOp(self.shape, sizes)
        return self._apply_op(op)



[docs]
    def tile(self, *sizes) -> "Expr":
        """Apply a ``TileOp`` built from the current shape and ``sizes``."""
        from boundlab.linearop import TileOp
        op = TileOp(self.shape, sizes)
        return self._apply_op(op)



[docs]
    def flip(self, dims) -> "Expr":
        """Apply a ``FlipOp`` built from the current shape and ``dims``."""
        from boundlab.linearop import FlipOp
        op = FlipOp(self.shape, dims)
        return self._apply_op(op)



[docs]
    def roll(self, shifts, dims) -> "Expr":
        """Apply a ``RollOp`` built from the current shape, ``shifts`` and ``dims``."""
        from boundlab.linearop import RollOp
        op = RollOp(self.shape, shifts, dims)
        return self._apply_op(op)



[docs]
    def diag(self, diagonal=0) -> "Expr":
        """Apply a ``DiagOp`` built from the current shape and ``diagonal``."""
        from boundlab.linearop import DiagOp
        op = DiagOp(self.shape, diagonal)
        return self._apply_op(op)


    def __getitem__(self, indices) -> "Expr":
        """Select a sub-expression with int / slice indices via a ``GetItemOp``.

        A single index is wrapped into a tuple. 0-dim integer tensors
        (int32 / int64) are converted to Python ints.

        Raises:
            ValueError: If an integer index tensor is not 0-dimensional, or
                if any index is neither an ``int`` nor a ``slice``.
        """
        from boundlab.linearop import GetItemOp
        integer_dtypes = [torch.int, torch.long, torch.int32, torch.int64]
        key = indices if isinstance(indices, tuple) else (indices,)

        resolved = []
        for pos, item in enumerate(key):
            if isinstance(item, torch.Tensor) and item.dtype in integer_dtypes:
                if item.dim() != 0:
                    raise ValueError(f"Index tensors must be 0-dimensional (scalars), but index {pos} has shape {item.shape}")
                item = int(item.item())
            resolved.append(item)
        key = tuple(resolved)

        if not all(isinstance(item, (slice, int)) for item in key):
            raise ValueError("Invalid indices for item selection")
        return self._apply_op(GetItemOp(self.shape, key))


[docs]
    def zeros_set(self, output_shape) -> Callable[[tuple], "Expr"]:
        """Return a function that places this expression into ``output_shape`` at given indices.

        The returned callable takes an index (or tuple of indices) made of
        ints and slices, unsqueezes this expression once per int index, and
        applies a ``SetSliceOp`` built from ``output_shape`` and the slices
        produced by ``make_set_slices``. It raises ``ValueError`` for any
        other index kind.
        """
        from boundlab.linearop import SetSliceOp, make_set_slices, get_int_dims, UnsqueezeOp
        def zeros_set(indices):
            # Accept a bare index as a 1-tuple.
            if not isinstance(indices, tuple):
                indices = (indices,)
            if all(isinstance(idx, slice) or isinstance(idx, int) for idx in indices):
                int_dims = get_int_dims(indices)
                # First unsqueeze for any int dims (they will be embedded as length-1)
                expr = self
                # NOTE(review): when inserting dims in ascending order, earlier
                # insertions already shift later positions, so subtracting ``i``
                # looks suspicious for non-adjacent int dims (e.g. dims 0 and 2).
                # Whether this is correct depends on what ``get_int_dims``
                # returns — confirm.
                for i, dim in enumerate(sorted(int_dims)):
                    adjusted_dim = dim - i
                    expr = expr.unsqueeze(adjusted_dim)
                # Now make the slices for the full-dim version
                slices = make_set_slices(output_shape, indices)
                return expr._apply_op(SetSliceOp(output_shape, slices))
            else:
                raise ValueError("Invalid indices for zero setting")
        return zeros_set

    

[docs]
    def scatter(self, indices, output_shape) -> "Expr":
        """Apply a ``ScatterOp`` built from ``indices``, the current shape and ``output_shape``."""
        from boundlab.linearop import ScatterOp
        op = ScatterOp(indices, self.shape, output_shape)
        return self._apply_op(op)

    

[docs]
    def gather(self, indices, dim: int = 0) -> "Expr":
        """Apply a ``GatherOp`` built from the current shape, ``dim`` and ``indices``."""
        from boundlab.linearop import GatherOp
        op = GatherOp(self.shape, dim, indices)
        return self._apply_op(op)


    def _normalize_reduce_dims(self, dim: Union[int, tuple[int, ...], list[int], torch.Tensor, None]) -> tuple[int, ...]:
        rank = len(self.shape)
        if dim is None:
            return tuple(range(rank))
        if isinstance(dim, int):
            dims = (dim,)
        elif isinstance(dim, torch.Tensor):
            dims = tuple(int(d) for d in dim.flatten().tolist())
        else:
            dims = tuple(int(d) for d in dim)

        normalized: list[int] = []
        for d in dims:
            d0 = d + rank if d < 0 else d
            if d0 < 0 or d0 >= rank:
                raise IndexError(f"Reduction dim {d} out of range for shape {tuple(self.shape)}")
            if d0 not in normalized:
                normalized.append(d0)
        return tuple(sorted(normalized))


[docs]
    def sum(self, dim: Union[int, tuple[int, ...], list[int], torch.Tensor, None] = None, keepdim: bool = False) -> "Expr":
        """Sum over the given dimensions using an all-ones ``EinsumOp``.

        Args:
            dim: Axis or axes to reduce; ``None`` reduces all axes.
            keepdim: When true, each reduced axis is kept in the output via
                a dedicated trailing size-1 axis of the weight tensor.

        Returns:
            ``self`` when there is nothing to reduce, otherwise the wrapped
            ``EinsumOp`` expression.
        """
        from boundlab.linearop import EinsumOp

        reduced = self._normalize_reduce_dims(dim)
        if not reduced:
            return self

        rank = len(self.shape)
        source_axes = list(range(rank))
        kernel = torch.ones(self.shape)

        if keepdim:
            # Each reduced axis gets its own extra size-1 weight axis, numbered
            # after the input axes in ascending order of the reduced axis.
            extra_axis = {axis: rank + k for k, axis in enumerate(reduced)}
            for _ in reduced:
                kernel = kernel.unsqueeze(-1)
            target_axes = [extra_axis.get(axis, axis) for axis in source_axes]
        else:
            target_axes = [axis for axis in source_axes if axis not in reduced]

        op = EinsumOp(kernel, input_dims=source_axes, output_dims=target_axes)
        return self._apply_op(op)



[docs]
    def mean(self, dim: Union[int, tuple[int, ...], list[int], torch.Tensor, None] = None, keepdim: bool = False) -> "Expr":
        reduce_dims = self._normalize_reduce_dims(dim)
        if len(reduce_dims) == 0:
            return self

        denom = 1
        for d in reduce_dims:
            denom *= int(self.shape[d])
        return self.sum(dim=reduce_dims, keepdim=keepdim) / float(denom)


    # ------------------------------------------------------------------
    # Bound computation helpers
    # ------------------------------------------------------------------


[docs]
    def ub(self) -> torch.Tensor:
        """Upper bound of this expression, delegated to ``boundlab.prop.ub``."""
        from boundlab import prop
        compute = prop.ub
        return compute(self)



[docs]
    def lb(self) -> torch.Tensor:
        """Lower bound of this expression, delegated to ``boundlab.prop.lb``."""
        from boundlab import prop
        compute = prop.lb
        return compute(self)



[docs]
    def ublb(self) -> tuple[torch.Tensor, torch.Tensor]:
        """Upper and lower bounds together, delegated to ``boundlab.prop.ublb``."""
        from boundlab import prop
        compute = prop.ublb
        return compute(self)



[docs]
    def center(self) -> torch.Tensor:
        """Center of the bounds, delegated to ``boundlab.prop.center``."""
        from boundlab import prop
        compute = prop.center
        return compute(self)



[docs]
    def bound_width(self) -> torch.Tensor:
        """Width of the bounds, delegated to ``boundlab.prop.bound_width``."""
        from boundlab import prop
        compute = prop.bound_width
        return compute(self)



[docs]
    def max_bound_width(self) -> torch.Tensor:
        """Maximum bound width, delegated to ``boundlab.prop.max_bound_width``."""
        from boundlab import prop
        compute = prop.max_bound_width
        return compute(self)

    

[docs]
    def bound_width_reasons_breakdown(self) -> dict[str, torch.Tensor]:
        """Per-reason breakdown of the bound width, delegated to ``boundlab.prop``."""
        from boundlab import prop
        compute = prop.bound_width_reasons_breakdown
        return compute(self)

    

[docs]
    def uncertainty_reasons(self) -> dict[str, float]:
        """Compute the breakdown of the bound width by reason, aggregated to total contributions."""
        width = self.bound_width()
        index = width.argmax()
        indices = torch.unravel_index(index, width.shape)
        breakdown = self[*indices].bound_width_reasons_breakdown()
        return {reason: float(tensor.item()) for reason, tensor in breakdown.items()}

    

[docs]
    def get_const(self):
        """Return the concrete tensor if *self* is a pure constant expression, else None.

        Works for :class:`~boundlab.expr.ConstVal` and any :class:`~boundlab.expr.AffineSum`
        that has no symbolic children.
        """
        return None

    

[docs]
    def simplify_ops_(self):
        """Recursively compute simplified ops for affine expressions."""
        for child in self.children:
            child.simplify_ops_()



[docs]
    def is_symmetric_to_0(self) -> bool:
        """Report whether the ``SYMMETRIC_TO_0`` flag is set on this expression."""
        return ExprFlags.SYMMETRIC_TO_0 in self.flags



[docs]
    def split_const(self) -> tuple["Expr | 0", "Expr | 0"]:
        """Decompose this expression into a constant part and a zero-constant part.

        If the expression is symmetric about zero, the constant part is zero.
        If the expression is a pure constant, the zero-constant part is zero.

        Returns:
            A tuple ``(non_const_part, const_part)`` where exactly one of the two is zero.
        """
        raise NotImplementedError(f"The :code:`split_const` method is not implemented for {self.__class__.__name__}.")

    

[docs]
    def all_subnodes(self) -> list[Union["Expr", "TupleExpr"]]:
        """Return a list of all sub-expressions in the DAG rooted at this expression, in topological order."""
        visited = list()

        from boundlab.expr import TupleExpr, GetTupleItem

        def dfs(e: Union[Expr, TupleExpr]):
            if e in visited:
                return
            visited.append(e)
            for child in e.children:
                dfs(child)
        dfs(self)

        visited.sort(key=lambda e: e.id)
        return visited

    

[docs]
    def replace_subnode_once(self, replace_fn: Callable[["Expr"], Optional["Expr"]]) -> "Expr":
        """Return a new expression with the same structure but sub-expressions replaced by replace_fn."""
        visited = self.all_subnodes()
        for i, e in reversed(list(enumerate(visited))):
            new_e = replace_fn(e)
            if new_e is not None:
                new_visited = copy(visited)
                new_visited[i] = new_e
                for j in range(i + 1, len(visited)):
                    parent = visited[j]
                    new_children = tuple(new_visited[visited.index(child)] for child in parent.children)
                    new_visited[j] = parent.with_children(*new_children)
                return new_visited[-1]
        return self





[docs]
def expr_pretty_print(expr: Expr, indent: int = 0) -> str:
    """Pretty print an expression in SSA form.

    Every node from ``expr.all_subnodes()`` gets a line ``%<index> = <text>``
    unless it carries ``ExprFlags.PRINT_FUSE``; fused nodes are rendered
    inline inside the text of the node that uses them. ``<index>`` is the
    node's position in ``all_subnodes()``. Each line is prefixed with
    ``indent`` spaces.
    """
    from boundlab.expr import TupleExpr, GetTupleItem
    nodes = expr.all_subnodes()
    rendered = {}
    prefix = " " * indent

    def is_fused(node) -> bool:
        # Only Expr instances carry flags; anything else is never fused.
        return isinstance(node, Expr) and ExprFlags.PRINT_FUSE in node.flags

    def operands_of(node):
        # A GetTupleItem is printed in terms of the tuple it reads from.
        if isinstance(node, GetTupleItem):
            return (node.tuple_expr,)
        return node.children

    def render(node) -> str:
        if node in rendered:
            return rendered[node]
        parts = [
            render(operand) if is_fused(operand) else f'%{nodes.index(operand)}'
            for operand in operands_of(node)
        ]
        text = node.to_string(*parts)
        rendered[node] = text
        return text

    lines = []
    for position, node in enumerate(nodes):
        if not is_fused(node):
            lines.append(prefix + f"%{position} = {render(node)}")
    return "\n".join(lines)