universal/algos/mpt.py

import logging

import numpy as np
import pandas as pd
from cvxopt import matrix, solvers
from scipy import optimize
from six import string_types
from sklearn import covariance
from sklearn.base import BaseEstimator

from .. import tools
from ..algo import Algo
from .estimators import *

solvers.options["show_progress"] = False


class MPT(Algo):
    """Modern portfolio theory approach. See https://en.wikipedia.org/wiki/Modern_portfolio_theory."""

    PRICE_TYPE = "ratio"

    def __init__(
        self,
        window=None,
        mu_estimator=None,
        cov_estimator=None,
        mu_window=None,
        cov_window=None,
        min_history=None,
        bounds=None,
        max_leverage=1.0,
        method="mpt",
        q=0.01,
        gamma=0.0,
        optimizer_options=None,
        force_weights=None,
        **kwargs,
    ):
        """
        :param window: Window for calculating mean and variance. Use None for entire history.
        :param mu_estimator: TODO
        :param cov_estimator: TODO
        :param min_history: Use zero weights for first min_periods. Default is 1 year
        :param max_leverage: Max leverage to use.
        :param method: optimization objective - can be "mpt", "sharpe" and "variance"
        :param q: depends on method, e.g. for "mpt" it is risk aversion parameter (higher means lower aversion to risk)
            from https://en.wikipedia.org/wiki/Modern_portfolio_theory#Efficient_frontier_with_no_risk-free_asset
            q=2 is equivalent to full-kelly, q=1 is equivalent to half kelly
        :param gamma: Penalize changing weights (can be number or Series with individual weights such as fees)
        """
        super().__init__(min_history=min_history, **kwargs)
        mu_window = mu_window or window
        cov_window = cov_window or window
        self.method = method
        self.q = q
        self.gamma = gamma
        self.bounds = bounds or {}
        self.force_weights = force_weights
        self.max_leverage = max_leverage
        self.optimizer_options = optimizer_options or {}

        if bounds and max_leverage != 1:
            raise NotImplemented(
                "max_leverage cannot be used with bounds, consider removing max_leverage and replace it with bounds1"
            )

        if cov_estimator is None:
            cov_estimator = "empirical"

        if isinstance(cov_estimator, string_types):
            if cov_estimator == "empirical":
                # use pandas covariance in init_step
                cov_estimator = covariance.EmpiricalCovariance()
            elif cov_estimator == "ledoit-wolf":
                cov_estimator = covariance.LedoitWolf()
            elif cov_estimator == "graph-lasso":
                cov_estimator = covariance.GraphLasso()
            elif cov_estimator == "oas":
                cov_estimator = covariance.OAS()
            elif cov_estimator == "single-index":
                cov_estimator = SingleIndexCovariance()
            else:
                raise NotImplemented(
                    "Unknown covariance estimator {}".format(cov_estimator)
                )

        # handle sklearn models
        if isinstance(cov_estimator, BaseEstimator):
            cov_estimator = CovarianceEstimator(cov_estimator, window=cov_window)

        if mu_estimator is None:
            mu_estimator = SharpeEstimator()

        if isinstance(mu_estimator, string_types):
            if mu_estimator == "historical":
                mu_estimator = HistoricalEstimator(window=mu_window)
            elif mu_estimator == "sharpe":
                mu_estimator = SharpeEstimator()
            else:
                raise NotImplemented("Unknown mu estimator {}".format(mu_estimator))

        self.cov_estimator = cov_estimator
        self.mu_estimator = mu_estimator

    def init_weights(self, columns):
        b = np.array([0.0 if c == "CASH" else 1.0 for c in columns])
        return b / b.sum()

    def init_step(self, X):
        # set min history to 1 year
        if not self.min_history:
            self.min_history = tools.freq(X.index)

        # replace covariance estimator with empirical covariance and precompute it
        if isinstance(self.cov_estimator, covariance.EmpiricalCovariance):

            class EmpiricalCov(object):
                """Behave like sklearn covariance estimator."""

                allow_nan = True

                def __init__(self, X, window, min_history):
                    self.C = tools.rolling_cov_pairwise(
                        X, window=window, min_periods=min_history
                    )

                def fit(self, X):
                    # get sigma matrix
                    x = X.iloc[-1]
                    sigma = self.C[x.name]

                    # make sure sigma is properly indexed
                    sigma = sigma.reindex(index=x.index).reindex(columns=x.index)

                    self.covariance_ = sigma.values
                    return self

            self.cov_estimator = CovarianceEstimator(
                EmpiricalCov(X, self.cov_estimator.window, self.min_history)
            )

    def estimate_mu_sigma_sh(self, S):
        X = self._convert_prices(S, self.PRICE_TYPE, self.REPLACE_MISSING)

        sigma = self.cov_estimator.fit(X - 1)
        mu = self.mu_estimator.fit(X, sigma)
        vol = np.sqrt(np.diag(sigma))
        sh = (mu - self.mu_estimator.rfr) / vol
        sh[vol == 0] = 0.0

        return mu, sigma, sh

    def portfolio_mu(self, last_b, mu):
        return (last_b * mu).sum()

    def portfolio_vol(self, last_b, sigma):
        w = last_b.values
        sigma = sigma.reindex(index=last_b.index, columns=last_b.index).values
        return np.sqrt((w @ sigma @ w))

    def portfolio_gradient(self, last_b, mu, sigma, q=None, decompose=False):
        """Calculate gradient for given objective function. Can be used to determine which stocks
        should be added / removed from portfolio.
        """
        q = q or self.q
        w = last_b.values
        mu = mu.values
        sigma = sigma.values

        p_vol = np.sqrt(w @ sigma @ w)
        p_mu = w @ mu

        if self.method == "sharpe":
            grad_sharpe = mu.T / p_vol
            grad_vol = -sigma * w.T * p_mu / p_vol ** 3

            grad_sharpe = pd.Series(np.array(grad_sharpe).ravel(), index=last_b.index)
            grad_vol = pd.Series(np.array(grad_vol).ravel(), index=last_b.index)

            if decompose:
                return grad_sharpe, grad_vol
            else:
                return grad_sharpe + grad_vol
        elif self.method == "mpt":
            grad_mu = pd.Series(np.array(mu).ravel(), index=last_b.index)
            grad_sigma = pd.Series((sigma @ w).ravel(), index=last_b.index)
            grad_vol = pd.Series(
                np.array(-sigma @ w / p_vol).ravel(), index=last_b.index
            )

            if decompose:
                return grad_mu, grad_vol
            else:
                return q * grad_mu - 2 * grad_sigma
        else:
            raise NotImplemented("Method {} not yet implemented".format(self.method))

    def step(self, x, last_b, history, **kwargs):
        # get sigma and mu estimates
        X = history

        if self.bounds.keys() - X.columns - {"all"}:
            raise Exception(
                f'Bounds for undefined symbols {self.bounds.keys() - X.columns - set(["all"])}'
            )

        # remove assets with NaN values
        # cov_est = self.cov_estimator.cov_est
        # if hasattr(cov_est, 'allow_nan') and cov_est.allow_nan:
        #     na_assets = (X.notnull().sum() < self.min_history).values
        # else:
        #     na_assets = X.isnull().any().values

        # check NA assets
        na_assets = (X.notnull().sum() < self.min_history).values
        if any(na_assets):
            logging.warning(
                "Assets containing null values: {}".format(X.columns[na_assets])
            )
            # raise Exception('Assets containing null values: {}'.format(X.columns[na_assets]))

        # TODO: should we enable this?
        # X = X.iloc[:, ~na_assets]
        # x = x[~na_assets]
        # last_b = last_b[~na_assets]

        # get sigma and mu estimations
        sigma = self.cov_estimator.fit(X - 1)
        mu = self.mu_estimator.fit(X, sigma)

        ss = pd.Series(np.diag(sigma), index=sigma.columns)

        assert (mu.index == X.columns).all()

        # make Series from gamma
        gamma = self.gamma
        if isinstance(gamma, float):
            gamma = x * 0 + gamma
        elif callable(gamma):
            # use gamma as a function
            pass
        else:
            gamma = gamma.reindex(x.index)
            gamma_null = gamma[gamma.isnull()]
            assert len(gamma_null) == 0, "gamma is missing values for {}".format(
                gamma_null.index
            )

        # find optimal portfolio
        last_b = pd.Series(last_b, index=x.index, name=x.name)
        b = self.optimize(
            mu,
            sigma,
            q=self.q,
            gamma=gamma,
            max_leverage=self.max_leverage,
            last_b=last_b,
            **kwargs,
        )
        b = pd.Series(b, index=X.columns).reindex(history.columns, fill_value=0.0)

        return b

    def optimize(self, mu, sigma, q, gamma, max_leverage, last_b, **kwargs):
        if self.method == "mpt":
            return self._optimize_mpt(mu, sigma, q, gamma, last_b, **kwargs)
        elif self.method == "sharpe":
            return self._optimize_sharpe(
                mu, sigma, q, gamma, max_leverage, last_b, **kwargs
            )
        elif self.method == "variance":
            return self._optimize_variance(
                mu, sigma, q, gamma, max_leverage, last_b, **kwargs
            )
        else:
            raise Exception("Unknown method {}".format(self.method))

    def _optimize_sharpe(self, mu, sigma, q, gamma, max_leverage, last_b):
        """Maximize sharpe ratio b.T * mu / sqrt(b.T * sigma * b + q)"""
        mu = np.matrix(mu)
        sigma = np.matrix(sigma)

        def maximize(bb):
            if callable(gamma):
                fee_penalization = gamma(pd.Series(bb, index=last_b.index), last_b)
            else:
                fee_penalization = sum(gamma * abs(bb - last_b))
            bb = np.matrix(bb)
            return -mu * bb.T / np.sqrt(bb * sigma * bb.T + q) + fee_penalization

        if self.allow_cash:
            cons = ({"type": "ineq", "fun": lambda b: max_leverage - sum(b)},)
        else:
            cons = ({"type": "eq", "fun": lambda b: max_leverage - sum(b)},)

        bounds = [(0.0, max_leverage)] * len(last_b)

        if self.max_weight:
            bounds = [
                (max(l, -self.max_weight), min(u, self.max_weight)) for l, u in bounds
            ]

        x0 = last_b
        MAX_TRIES = 3

        for _ in range(MAX_TRIES):
            res = optimize.minimize(
                maximize,
                x0,
                bounds=bounds,
                constraints=cons,
                method="slsqp",
                options=self.optimizer_options,
            )

            # it is possible that slsqp gives out-of-bounds error, try it again with different x0
            if np.any(res.x < -0.01) or np.any(res.x > max_leverage + 0.01):
                x0 = np.random.random(len(res.x))
            else:
                break
        else:
            raise Exception()

        return res.x

    def _optimize_mpt(self, mu, sigma, q, gamma, last_b):
        """Minimize b.T * sigma * b - q * b.T * mu"""
        assert (mu.index == sigma.columns).all()
        assert (mu.index == last_b.index).all()

        symbols = list(mu.index)
        sigma = np.array(sigma)
        mu = np.array(mu).T
        n = len(symbols)

        force_weights = self.force_weights or {}

        # portfolio constraints
        bounds = self.bounds or {}
        if "all" not in bounds:
            bounds["all"] = (0, 1)

        G = []
        h = []
        for i, sym in enumerate(symbols):
            # forced weights
            if sym in force_weights:
                continue

            # constraints
            lower, upper = bounds.get(sym, bounds["all"])
            if lower is not None:
                r = np.zeros(n)
                r[i] = -1
                G.append(r)
                h.append(-lower)

            if upper is not None:
                r = np.zeros(n)
                r[i] = 1
                G.append(r)
                h.append(upper)

            # # additional constraints on selling
            # if sym not in allow_sell:
            #     r = np.zeros(n)
            #     r[i] = -1
            #     G.append(r)
            #     h.append(-last_b[i])

        G = matrix(np.vstack(G).astype(float))
        h = matrix(np.array(h).astype(float))

        b = _maximize(mu, sigma, q, n, G, h, symbols, last_b, force_weights)
        # try:
        #     b = maximize(mu, sigma, q)
        # except ValueError as e:
        #     raise e
        #     b = last_b

        # second optimization for fees
        if (gamma != 0).any() and (b != last_b).any():
            b = maximize_with_penalization(b, last_b, mu, sigma, q, gamma)
        return b

    def _optimize_variance(self, mu, sigma, q, gamma, max_leverage, last_b):
        """Minimize b.T * sigma * b subject to b.T * mu >= q. If you find no such solution,
        just maximize return."""
        sigma = np.matrix(sigma)
        mu = np.matrix(mu)

        def maximize(mu, sigma, q):
            n = len(last_b)

            P = matrix(2 * sigma)
            qq = matrix(np.zeros(n))
            G = matrix(np.r_[-np.eye(n), -mu])
            h = matrix(np.r_[np.zeros(n), -q])

            try:
                if max_leverage is None or max_leverage == float("inf"):
                    sol = solvers.qp(P, qq, G, h)
                else:
                    if self.allow_cash:
                        G = matrix(np.r_[G, matrix(np.ones(n)).T])
                        h = matrix(np.r_[h, matrix([self.max_leverage])])
                        sol = solvers.qp(P, qq, G, h, initvals=last_b)
                    else:
                        A = matrix(np.ones(n)).T
                        b = matrix(np.array([max_leverage]))
                        sol = solvers.qp(P, qq, G, h, A, b, initvals=last_b)

                if sol["status"] == "unknown":
                    raise ValueError()

            except ValueError:
                # no feasible solution - maximize return instead
                P = P * 0
                qq = matrix(-mu.T)
                G = matrix(np.r_[-np.eye(n), matrix(np.ones(n)).T])
                h = matrix(np.r_[np.zeros(n), self.max_leverage])

                sol = solvers.qp(P, qq, G, h)

            return np.squeeze(sol["x"])

        b = maximize(mu, sigma, q)
        return b


# regularization parameter for singular cases
ALPHA = 0.000001


def _maximize(mu, sigma, q, n, G, h, symbols, last_b, force_weights):
    P = matrix(2 * (sigma + ALPHA * np.eye(n)))
    q = matrix(-q * mu + 2 * ALPHA * last_b.values)

    A = matrix(np.ones(n)).T
    b = matrix(np.array([1.0]))

    for sym, w in force_weights.items():
        ix = symbols.index(sym)
        a = np.zeros(n)
        a[ix] = 1
        A = matrix(np.r_[A, matrix(a).T])
        b = matrix(np.r_[b, matrix([w])])

    sol = solvers.qp(P, q, G, h, A, b, initvals=last_b)

    if sol["status"] != "optimal":
        logging.warning(
            "Solution not found for {}, using last weights".format(last_b.name)
        )
        return last_b

    return np.squeeze(sol["x"])


def _maximize_with_penalization(b, last_b, mu, sigma, q, gamma):
    n = len(mu)
    c = np.sign(b - last_b)
    sigma = matrix(sigma)
    mu = matrix(mu)

    P = 2 * (sigma + ALPHA * matrix(np.eye(n)))
    qq = 2 * sigma * matrix(last_b) - q * mu + matrix(gamma * c)

    G = matrix(np.r_[-np.diag(c), np.eye(n), -np.eye(n)])
    h = matrix(np.r_[np.zeros(n), 1.0 - last_b, last_b])

    A = matrix(np.ones(n)).T
    b = matrix([1.0 - sum(last_b)])

    sol = solvers.qp(P, qq, G, h, A, b, initvals=np.zeros(n))

    return np.squeeze(sol["x"]) + np.array(last_b)