Source code for rlaopt.expression.expression

"""Expression module for symbolic optimization modeling.

This module provides the core expression class for building symbolic mathematical
expressions that can be evaluated, differentiated, and optimized. Expressions are
built compositionally through operator overloading and can represent optimization
objectives, constraints, and models.

Classes:
    Expression: Abstract base class for all expressions.
"""

from abc import ABC, abstractmethod
from collections import defaultdict

import torch
from typing_extensions import Self

from rlaopt.expression import expr_types
from rlaopt.expression.tree import ExprTree
from rlaopt.expression.utils import _create_product, _create_sum
from rlaopt.ext_tensordict import TensorDict



[docs]
class Expression(torch.nn.Module, ABC):
    """Abstract base class for all expressions.

    Expression extends torch.nn.Module to provide automatic parameter tracking,
    gradient computation, and device management. All concrete expression types
    (Variable, SumExpression, etc.) inherit from this base class.

    Expressions support operator overloading for natural mathematical syntax:
        - Arithmetic: +, -, *, /, @, **
        - Comparisons: Used in constraints (future)
        - Composition: Expressions can be nested arbitrarily

    Attributes:
        None (abstract class)
    """


[docs]
    def __init__(self):
        """Initialize the Expression base class."""
        super().__init__()



[docs]
    @abstractmethod
    def is_smooth(self) -> bool:
        """Check if the expression is smooth (differentiable everywhere).

        Smoothness is important for choosing optimization algorithms. Smooth
        expressions can use gradient-based methods, while non-smooth expressions
        require specialized algorithms like proximal methods or subgradient methods.

        Returns:
            bool: True if the expression is smooth, False otherwise.
        """
        pass



[docs]
    @abstractmethod
    def forward(self) -> torch.Tensor:
        """Evaluate the expression using current parameter values.

        This method evaluates the expression with the current values of all
        registered parameters.

        Returns:
            torch.Tensor: The evaluated result.
        """
        pass



[docs]
    @abstractmethod
    def tree(self) -> ExprTree:
        """Return a tree representation of the expression structure.

        Returns an ExprTree object showing how expressions are composed.
        Useful for testing that expression optimizations (constant folding,
        flattening, etc.) are working correctly.

        Each subclass implements this method to expose its own structure without
        leaking implementation details to the base class.

        Returns:
            ExprTree: Tree structure with node type and children.
        """
        pass



[docs]
    def is_affine(self) -> bool:
        """Check if the expression is affine.

        An expression is affine if it can be expressed as a linear function of variables
        plus a constant.

        Returns:
            bool: True if the expression is affine, False otherwise.
        """
        return False



[docs]
    def evaluate(self, variable_values: TensorDict) -> torch.Tensor:
        """Evaluate the expression at specified variable values.

        Unlike forward(), this method evaluates the expression at variable
        values different from those currently stored. Useful for line searches,
        parameter exploration, etc.

        Note that the user can specify a partial set of variables; any variables
        not included will be evaluated at their current stored values. Any variables in
        the input that are not part of this expression will be ignored.

        Args:
            variable_values: Dictionary mapping variable names to their values.

        Returns:
            torch.Tensor: The evaluated result.

        Examples:
            >>> x = Variable((5,), name='x')
            >>> new_params = TensorDict({'x': torch.ones(5)})
            >>> result = x.evaluate(new_params)
            >>> torch.equal(result, new_params['x'])
            True
        """
        variable_values_selected = self.select_relevant_variables(variable_values)
        params = self._variable_values_to_params_dict(variable_values_selected)
        result = torch.func.functional_call(
            self, params, args=None, kwargs=None, tie_weights=False
        )

        return result


    @property
    def variable_values(self) -> TensorDict:
        """Get variables as a dictionary.

        Returns:
            TensorDict: Dictionary of variable names to variable tensors.
        """
        vars_dict = {}
        for _, module in self.named_modules():
            if (
                isinstance(module, expr_types.variable())
                and module.name not in vars_dict
            ):
                vars_dict[module.name] = module.value
        return TensorDict(vars_dict)


[docs]
    def get_variable_names(self) -> list[str]:
        """Returns the list of variable names in order."""
        return list(self.variable_values.keys())



[docs]
    def get_variable_shapes(self) -> dict[str, torch.Size]:
        """Returns a dictionary mapping variable names to their shapes."""
        return {var_name: var.shape for var_name, var in self.variable_values.items()}



[docs]
    def update_variables(self, variable_values: TensorDict):
        """Update variables from a TensorDict.

        Note that this method allows partial updates; only the variables
        specified in the input TensorDict will be updated, while others
        will remain unchanged. Any variables in the input that are not
        part of this expression will be ignored.

        Args:
            variable_values (TensorDict): TensorDict with new variable values.

        Examples:
            >>> x = Variable((5,), name='x')
            >>> x.update_variables(TensorDict({'x': torch.ones(5)}))
            >>> torch.equal(x.value, torch.ones(5))
            True
        """
        variable_values_selected = self.select_relevant_variables(variable_values)
        params_dict = self._variable_values_to_params_dict(variable_values_selected)
        # Use strict=False to allow partial updates
        self.load_state_dict(params_dict, strict=False)



[docs]
    def select_relevant_variables(self, variable_values: TensorDict) -> TensorDict:
        """Select variables relevant to this expression from a TensorDict.

        Args:
            variable_values (TensorDict): TensorDict containing variable values.

        Returns:
            TensorDict: TensorDict with only variables relevant to this expression.
        """
        relevant_var_names = self.get_variable_names()
        # Setting strict=False to avoid errors if some variables are missing
        return variable_values.select(*relevant_var_names, strict=False)


    def _variable_values_to_params_dict(self, variable_values: TensorDict) -> dict:
        """Convert a variables dict to a parameters dict.

        Maps variable names to their corresponding parameter names in the
        module hierarchy.
        """
        vars_to_param_names_map = self._get_variables_to_param_names_mapping()
        params_dict = {}
        for var_name, tensor in variable_values.items():
            for param_name in vars_to_param_names_map[var_name]:
                params_dict[param_name] = tensor
        return params_dict

    def _get_variables_to_param_names_mapping(self) -> dict[str, list[str]]:
        mapping = defaultdict(list)
        for module_path, module in self.named_modules():
            if isinstance(module, expr_types.variable()):
                # We have to account for the full module path to get
                # the correct parameter name
                full_param_name = (
                    f"{module_path}.{module._name}" if module_path else module._name
                )
                mapping[module.name].append(full_param_name)
        return mapping


[docs]
    def transpose(self) -> Self:
        """Create a transpose operation.

        Optimizes double transpose (A.T.T returns A).

        Returns:
            Expression: Transposed expression or original if already transposed twice.
        """
        from rlaopt.expression.unary_expressions import Transpose

        # Optimize A.T.T -> A
        if isinstance(self, Transpose):
            return self.operand
        return Transpose(self)


    @property
    def T(self) -> Self:
        """Transpose property (shorthand for transpose()).

        Returns:
            Expression: Transposed expression.
        """
        return self.transpose()


[docs]
    def sum(self, dim=None) -> Self:
        """Create a sum reduction operation.

        Args:
            dim: Dimension to sum over (None for all dimensions).

        Returns:
            ReduceSum: Expression computing the sum.
        """
        from rlaopt.expression.unary_expressions import ReduceSum

        return ReduceSum(self, dim=dim)


    # ----------------------
    # Centralized operator overloads
    # ----------------------

[docs]
    def __add__(self, other):
        """Add two expressions or an expression and a scalar.

        Args:
            other: Expression, float, or int to add.

        Returns:
            Expression: Sum of self and other (optimized).
        """
        return _create_sum(self, other)



[docs]
    def __radd__(self, other):
        """Add a scalar and an expression (reverse operation).

        Args:
            other: Float or int to add.

        Returns:
            Expression: Sum of other and self (optimized).
        """
        return _create_sum(other, self)



[docs]
    def __sub__(self, other):
        """Subtract an expression or scalar from this expression.

        Args:
            other: Expression, float, or int to subtract.

        Returns:
            Expression: Difference of self and other (optimized).
        """
        return _create_sum(self, -other)



[docs]
    def __rsub__(self, other):
        """Subtract this expression from a scalar (reverse operation).

        Args:
            other: Float or int to subtract from.

        Returns:
            Expression: Difference of other and self (optimized).
        """
        return _create_sum(other, -self)



[docs]
    def __neg__(self):
        """Negate this expression.

        Returns:
            Expression: Negation of self.
        """
        return _create_product(-1.0, self, matmul=False)



[docs]
    def __mul__(self, other):
        """Multiply this expression by another (elementwise).

        Args:
            other: Expression, float, or int to multiply.

        Returns:
            Expression: Elementwise product of self and other.
                If multiplying a scalar by a sum, automatically distributes.
        """
        return _create_product(self, other, matmul=False)



[docs]
    def __rmul__(self, other):
        """Multiply a scalar by this expression (reverse operation).

        Args:
            other: Float or int to multiply.

        Returns:
            Expression: Elementwise product of other and self.
                If multiplying a scalar by a sum, automatically distributes.
        """
        return _create_product(other, self, matmul=False)



[docs]
    def __truediv__(self, other):
        """Divide this expression by a scalar.

        Args:
            other: Float or int to divide by.

        Returns:
            Expression: Result of division (optimized).
                If dividing a sum by a scalar, automatically distributes.
        """
        if isinstance(other, (int, float)):
            return _create_product(self, 1.0 / other, matmul=False)
        return NotImplemented



[docs]
    def __matmul__(self, other):
        """Matrix multiply this expression by another.

        Args:
            other: Expression, float, or int to multiply.

        Returns:
            Expression: Matrix product of self and other.
        """
        return _create_product(self, other, matmul=True)



[docs]
    def __rmatmul__(self, other):
        """Matrix multiply a value by this expression (reverse operation).

        Args:
            other: Expression, float, or int to multiply.

        Returns:
            Expression: Matrix product of other and self.
        """
        return _create_product(other, self, matmul=True)



[docs]
    def __pow__(self, exponent):
        """Raise this expression to a power (elementwise).

        Args:
            exponent: Power to raise to.

        Returns:
            Expression: Result of exponentiation.
        """
        from rlaopt.expression.unary_expressions import Power

        return Power(self, exponent)