# Source code for deepdow.benchmarks

"""Collection of benchmarks."""
from abc import ABC, abstractmethod

import cvxpy as cp
from cvxpylayers.torch import CvxpyLayer
import torch

from .layers import CovarianceMatrix


class Benchmark(ABC):
    """Abstract benchmark class.

    The idea is to create some benchmarks that we can use for comparison to our neural networks. Note that we
    assume that benchmarks are not trainable - one can only use them for inference.

    """

    @abstractmethod
    def __call__(self, x):
        """Prediction of the model.

        Abstract - every concrete benchmark has to override this method.

        """

    @property
    def hparams(self):
        """Hyperparameters relevant to construction of the model.

        The base implementation returns an empty dictionary.

        """
        return {}


class InverseVolatility(Benchmark):
    """Allocation only considering volatility of individual assets.

    Parameters
    ----------
    use_std : bool
        If True, then we use standard deviation as a measure of volatility. Otherwise variance is used.

    returns_channel : int
        Which channel in the `x` feature matrix to consider (the 2nd dimension) as returns.

    """

    def __init__(self, use_std=False, returns_channel=0):
        self.use_std = use_std
        self.returns_channel = returns_channel

    def __call__(self, x):
        """Predict weights.

        Parameters
        ----------
        x : torch.Tensor
            Tensor of shape `(n_samples, n_channels, lookback, n_assets)`.

        Returns
        -------
        weights : torch.Tensor
            Tensor of shape `(n_samples, n_assets)` representing the predicted weights.

        """
        # Small constant added to the volatility so that the reciprocal below stays finite
        # when an asset has zero volatility over the lookback window.
        eps = 1e-6

        # Select the returns channel -> (n_samples, lookback, n_assets)
        x_rets = x[:, self.returns_channel, ...]

        # Reduce over the lookback dimension to get one volatility figure per asset.
        vols = x_rets.std(dim=1) if self.use_std else x_rets.var(dim=1)
        ivols = 1 / (vols + eps)

        # Normalize per sample so that the weights sum up to one.
        weights = ivols / ivols.sum(dim=1, keepdim=True)

        return weights

    @property
    def hparams(self):
        """Hyperparameters relevant to construction of the model."""
        return {'use_std': self.use_std,
                'returns_channel': self.returns_channel}


class MaximumReturn(Benchmark):
    """Markowitz portfolio optimization - maximum return.

    Parameters
    ----------
    max_weight : float
        A number in (0, 1] representing the maximum weight per asset.

    n_assets : None or int
        If specified the benchmark will always have to be provided with `n_assets` of assets in the `__call__`.
        This way one can achieve major speedups since the optimization problem is canonicalized only once in the
        constructor. However, when `n_assets` is None the optimization problem is canonicalized before each
        call inside of `__call__` which results in overhead but allows for variable number of assets.

    returns_channel : int
        Which channel in the `x` feature matrix to consider (the 2nd dimension) as returns.

    Attributes
    ----------
    optlayer : cvxpylayers.torch.CvxpyLayer or None
        Equal to None if `n_assets` not provided in the constructor. In this case optimization problem is constructed
        with each forward pass. This allows for variable number of assets but is slower. If `n_assets` provided then
        constructed once and for all in the constructor.

    """

    def __init__(self, max_weight=1, n_assets=None, returns_channel=0):
        self.max_weight = max_weight
        self.n_assets = n_assets
        self.returns_channel = returns_channel

        # Build the layer eagerly only when the number of assets is known upfront.
        self.optlayer = self._construct_problem(n_assets, max_weight) if self.n_assets is not None else None

    @staticmethod
    def _construct_problem(n_assets, max_weight):
        """Construct cvxpylayers problem.

        Parameters
        ----------
        n_assets : int
            Number of assets, i.e. length of both the returns parameter and the weights variable.

        max_weight : float
            Upper bound imposed on each individual weight.

        Returns
        -------
        cvxpylayers.torch.CvxpyLayer
            Layer with the returns as its only parameter and the weights as its only variable.

        """
        rets = cp.Parameter(n_assets)
        w = cp.Variable(n_assets)

        ret = rets @ w
        # Fully invested, long only and capped weights.
        prob = cp.Problem(cp.Maximize(ret), [cp.sum(w) == 1,
                                             w >= 0,
                                             w <= max_weight])

        return CvxpyLayer(prob, parameters=[rets], variables=[w])

    def __call__(self, x):
        """Predict weights.

        Parameters
        ----------
        x : torch.Tensor
            Tensor of shape `(n_samples, n_channels, lookback, n_assets)`.

        Returns
        -------
        weights : torch.Tensor
            Tensor of shape `(n_samples, n_assets)` representing the predicted weights.

        Raises
        ------
        ValueError
            If `n_assets` was fixed in the constructor and `x` has a different number of assets.

        """
        # Unpacking also enforces that `x` is 4 dimensional.
        _, _, _, n_assets = x.shape

        # Problem setup
        if self.optlayer is not None:
            if self.n_assets != n_assets:
                raise ValueError('Incorrect number of assets: {}, expected: {}'.format(n_assets, self.n_assets))

            optlayer = self.optlayer
        else:
            optlayer = self._construct_problem(n_assets, self.max_weight)

        # Expected returns are estimated as the mean over the lookback dimension.
        rets_estimate = x[:, self.returns_channel, :, :].mean(dim=1)  # (n_samples, n_assets)

        # The layer output is indexed by variable - the weights are the first (and only) one.
        return optlayer(rets_estimate)[0]

    @property
    def hparams(self):
        """Hyperparameters relevant to construction of the model."""
        return {'max_weight': self.max_weight,
                'returns_channel': self.returns_channel,
                'n_assets': self.n_assets}


class MinimumVariance(Benchmark):
    """Markowitz portfolio optimization - minimum variance.

    Parameters
    ----------
    max_weight : float
        A number in (0, 1] representing the maximum weight per asset.

    n_assets : None or int
        If specified the benchmark will always have to be provided with `n_assets` of assets in the `__call__`.
        This way one can achieve major speedups since the optimization problem is canonicalized only once in the
        constructor. However, when `n_assets` is None the optimization problem is canonicalized before each
        call inside of `__call__` which results in overhead but allows for variable number of assets.

    returns_channel : int
        Which channel in the `x` feature matrix to consider (the 2nd dimension) as returns.

    Attributes
    ----------
    optlayer : cvxpylayers.torch.CvxpyLayer or None
        Equal to None if `n_assets` not provided in the constructor. In this case optimization problem is constructed
        with each forward pass. This allows for variable number of assets but is slower. If `n_assets` provided then
        constructed once and for all in the constructor.

    """

    def __init__(self, max_weight=1, returns_channel=0, n_assets=None):
        self.n_assets = n_assets
        self.returns_channel = returns_channel
        self.max_weight = max_weight

        # Build the layer eagerly only when the number of assets is known upfront.
        self.optlayer = self._construct_problem(n_assets, max_weight) if self.n_assets is not None else None

    @staticmethod
    def _construct_problem(n_assets, max_weight):
        """Construct cvxpylayers problem.

        Parameters
        ----------
        n_assets : int
            Number of assets, i.e. side of the square parameter matrix and length of the weights variable.

        max_weight : float
            Upper bound imposed on each individual weight.

        Returns
        -------
        cvxpylayers.torch.CvxpyLayer
            Layer with the `(n_assets, n_assets)` matrix as its only parameter and the weights as its only variable.

        """
        covmat_sqrt = cp.Parameter((n_assets, n_assets))
        w = cp.Variable(n_assets)

        # The objective is the squared norm of the parameter matrix applied to the weights.
        risk = cp.sum_squares(covmat_sqrt @ w)
        # Fully invested, long only and capped weights.
        prob = cp.Problem(cp.Minimize(risk), [cp.sum(w) == 1,
                                              w >= 0,
                                              w <= max_weight])

        return CvxpyLayer(prob, parameters=[covmat_sqrt], variables=[w])

    def __call__(self, x):
        """Predict weights.

        Parameters
        ----------
        x : torch.Tensor
            Tensor of shape `(n_samples, n_channels, lookback, n_assets)`.

        Returns
        -------
        weights : torch.Tensor
            Tensor of shape `(n_samples, n_assets)` representing the predicted weights.

        Raises
        ------
        ValueError
            If `n_assets` was fixed in the constructor and `x` has a different number of assets.

        """
        # Unpacking also enforces that `x` is 4 dimensional.
        _, _, _, n_assets = x.shape

        # Problem setup
        if self.optlayer is not None:
            if self.n_assets != n_assets:
                raise ValueError('Incorrect number of assets: {}, expected: {}'.format(n_assets, self.n_assets))

            optlayer = self.optlayer
        else:
            optlayer = self._construct_problem(n_assets, self.max_weight)

        # Estimate the per sample parameter matrix from the returns channel.
        covmat_sqrt_estimates = CovarianceMatrix(sqrt=True)(x[:, self.returns_channel, :, :])

        # The layer output is indexed by variable - the weights are the first (and only) one.
        return optlayer(covmat_sqrt_estimates)[0]

    @property
    def hparams(self):
        """Hyperparameters relevant to construction of the model."""
        return {'max_weight': self.max_weight,
                'returns_channel': self.returns_channel,
                'n_assets': self.n_assets}


class OneOverN(Benchmark):
    """Equally weighted portfolio."""

    def __call__(self, x):
        """Predict weights.

        Parameters
        ----------
        x : torch.Tensor
            Tensor of shape `(n_samples, n_channels, lookback, n_assets)`.

        Returns
        -------
        weights : torch.Tensor
            Tensor of shape `(n_samples, n_assets)` representing the predicted weights. Every entry is equal
            to `1 / n_assets` and the tensor has the same dtype and device as `x`.

        """
        # Only the first and the last dimension matter; unpacking also enforces that `x` is 4 dimensional.
        n_samples, _, _, n_assets = x.shape

        return torch.ones((n_samples, n_assets), dtype=x.dtype, device=x.device) / n_assets


class Random(Benchmark):
    """Random allocation for each prediction."""

    def __call__(self, x):
        """Predict weights.

        Parameters
        ----------
        x : torch.Tensor
            Tensor of shape `(n_samples, n_channels, lookback, n_assets)`.

        Returns
        -------
        weights : torch.Tensor
            Tensor of shape `(n_samples, n_assets)` representing the predicted weights. The tensor has the
            same dtype and device as `x`.

        """
        # Only the first and the last dimension matter; unpacking also enforces that `x` is 4 dimensional.
        n_samples, _, _, n_assets = x.shape

        weights_unscaled = torch.rand((n_samples, n_assets), dtype=x.dtype, device=x.device)

        # `keepdim=True` yields shape (n_samples, 1) which broadcasts across assets, so there is no
        # need to materialize a repeated copy of the row sums.
        weights_sums = weights_unscaled.sum(dim=1, keepdim=True)

        return weights_unscaled / weights_sums


class Singleton(Benchmark):
    """Predict a single asset.

    Parameters
    ----------
    asset_ix : int
        Index of the asset to predict.

    """

    def __init__(self, asset_ix):
        self.asset_ix = asset_ix

    def __call__(self, x):
        """Predict weights.

        Parameters
        ----------
        x : torch.Tensor
            Tensor of shape `(n_samples, n_channels, lookback, n_assets)`.

        Returns
        -------
        weights : torch.Tensor
            Tensor of shape `(n_samples, n_assets)` representing the predicted weights. The column `asset_ix`
            is equal to one and all the other columns are zero.

        Raises
        ------
        IndexError
            If `asset_ix` does not lie in `range(n_assets)`. Note that negative indices are rejected too.

        """
        # Only the first and the last dimension matter; unpacking also enforces that `x` is 4 dimensional.
        n_samples, _, _, n_assets = x.shape

        # Membership is tested on the range directly - no need to build a throwaway set on each call.
        if self.asset_ix not in range(n_assets):
            raise IndexError('The selected asset index is out of range.')

        weights = torch.zeros((n_samples, n_assets), dtype=x.dtype, device=x.device)
        weights[:, self.asset_ix] = 1

        return weights

    @property
    def hparams(self):
        """Hyperparameters relevant to construction of the model."""
        return {'asset_ix': self.asset_ix}