Source code for torch_openreml.covariance.operator_kronecker_product
"""
Kronecker product covariance operator.
This module provides a Kronecker product operator for combining two
covariance matrices, for use in linear mixed-effects models.
Classes:
KroneckerProduct:
A Kronecker product covariance operator :math:`V = A \\otimes B`.
"""
from torch_openreml.covariance.operator import Operator
import torch
[docs]
class KroneckerProduct(Operator):
    r"""
    Covariance operator formed as the Kronecker product of two operands.

    .. math::

        \symbf{V} = \symbf{A} \otimes \symbf{B}

    For an :math:`m \times m` matrix :math:`\symbf{A}` and an
    :math:`n \times n` matrix :math:`\symbf{B}`, the product
    :math:`\symbf{V}` is :math:`mn \times mn`. Each operand may be a trainable
    :class:`~torch_openreml.covariance.matrix.Matrix` instance or a fixed
    :class:`torch.Tensor` value.
    """

    def __init__(self, *args, **kwargs):
        r"""
        Build the operator and check that exactly two operands were supplied.

        Args:
            *args: Exactly two operands as positional arguments or a single
                dict. The first is :math:`\symbf{A}`, the second
                :math:`\symbf{B}`.
            **kwargs: Exactly two operands as keyword arguments.

        Raises:
            ValueError: If the number of operands is not exactly two.

        Example:
            .. jupyter-execute::

                import torch
                from torch_openreml.covariance import AR1Matrix, ScalarMatrix, KroneckerProduct
                op = KroneckerProduct(time=AR1Matrix(2), subject=ScalarMatrix(2))
                params = torch.tensor([1.0, 1.0, 1.0])
                op(params)
        """
        # Operand collection is delegated to the base class; only the count
        # is validated here.
        super().__init__(*args, **kwargs)
        operand_count = len(self.operands)
        if operand_count != 2:
            raise ValueError("Two operands are required")

    def _get_or_build_intermediates(self, free_params):
        """
        Return the cached operand values and their Kronecker product.

        The built parameters are used as the lookup key for
        ``get_intermediates``. On a miss (``None``), both operands are
        built, their Kronecker product is computed, and the result is stored
        with ``set_intermediates`` before being returned.

        Args:
            free_params: Free parameters forwarded to ``build_params`` and
                ``build_operands``.

        Returns:
            dict: Mapping with keys ``"a"`` and ``"b"`` (the two operand
            values) and ``"v"`` (``torch.kron(a, b)``).
        """
        key = self.build_params(free_params)
        cached = self.get_intermediates(key)
        if cached is not None:
            return cached

        operand_values = self.build_operands(free_params)
        left = operand_values[0]
        right = operand_values[1]
        fresh = {"a": left, "b": right, "v": torch.kron(left, right)}
        self.set_intermediates(key, fresh)
        return fresh

    def __call__(self, free_params=None):
        """
        Evaluate the Kronecker product for the given free parameters.

        Also records the shape of the result on ``self._shape``.

        Args:
            free_params: Free parameters of the operands. If ``None``,
                ``self.free_param_defaults`` is used. Default: ``None``.

        Returns:
            torch.Tensor: The Kronecker product of the two operand values.
        """
        params = self.free_param_defaults if free_params is None else free_params
        product = self._get_or_build_intermediates(params)["v"]
        self._shape = tuple(product.shape)
        return product

    def manual_grad(self, free_params=None):
        r"""
        Evaluate the analytic Jacobian of :meth:`__call__` with respect to
        the trainable parameters.

        By the product rule, for
        :math:`\symbf{V} = \symbf{A} \otimes \symbf{B}` the derivative with
        respect to :math:`\theta_{\symbf{A}}` is
        :math:`\frac{\partial \symbf{A}}{\partial \theta_{\symbf{A}}} \otimes \symbf{B}`,
        and symmetrically for :math:`\theta_{\symbf{B}}`. The per-operand
        Jacobians come from
        :meth:`~torch_openreml.covariance.operator.Operator.operands_grad`
        and each is Kronecker-multiplied with the value of the other operand.

        Args:
            free_params (torch.Tensor or dict): Flat 1D parameter tensor or
                parameter dictionary.
                If omitted, default values are used. Default: ``None``.

        Returns:
            tuple: ``(grad, grad_names)``, where ``grad`` is a 3D tensor of
            shape ``(num_free_params, *shape)`` and ``grad_names`` is a list
            of the corresponding parameter names. Returns ``(None, [])`` if
            all parameters are fixed.

        Raises:
            TypeError: If ``free_params`` is not a Torch tensor.
            ValueError: If ``free_params`` is not a 1D tensor or has the
                wrong length, or if ``free_params`` is a dict with missing
                or unexpected keys.

        Example:
            .. jupyter-execute::

                import torch
                from torch_openreml.covariance import AR1Matrix, ScalarMatrix, KroneckerProduct
                op = KroneckerProduct(time=AR1Matrix(2), subject=ScalarMatrix(2))
                params = torch.tensor([1.0, 1.0, 1.0])
                grad, grad_names = op.manual_grad(params)
                grad

            .. jupyter-execute::

                grad_names
        """
        params = self.free_param_defaults if free_params is None else free_params

        jacobians, name_groups = self.operands_grad(params)
        intermediates = self._get_or_build_intermediates(params)
        left = intermediates["a"]
        right = intermediates["b"]

        pieces = []
        names = []

        # d(A ⊗ B)/dθ_A = dA/dθ_A ⊗ B; skipped when the first operand
        # reports no Jacobian (None).
        d_left = jacobians[0]
        if d_left is not None:
            pieces.append(torch.kron(d_left, right))
            names.extend(name_groups[0])

        # d(A ⊗ B)/dθ_B = A ⊗ dB/dθ_B; skipped when the second operand
        # reports no Jacobian (None).
        d_right = jacobians[1]
        if d_right is not None:
            pieces.append(torch.kron(left, d_right))
            names.extend(name_groups[1])

        if not pieces:
            return None, []
        return torch.cat(pieces), names