Source code for quantammsim.pools.G3M.quantamm.triple_threat_mean_reversion_channel_pool

"""Triple-threat mean-reversion-channel pool for QuantAMM.

Combines three EWMA-based signals -- a channel (mean-reversion) component, a
trend (momentum) component, and a Gaussian envelope that gates between them --
into a single weight-update rule. Small price deviations activate the channel
signal; large deviations activate the trend signal via a power-law response.

Key parameters: ``width`` (envelope scale), ``amplitude`` (channel strength),
``exponents`` (trend power-law), three independent ``logit_lamb`` values for
channel, trend, and envelope memory lengths.
"""
# again, this only works on startup!
from jax import config

config.update("jax_enable_x64", True)
from jax import default_backend
from jax import local_device_count, devices

DEFAULT_BACKEND = default_backend()
CPU_DEVICE = devices("cpu")[0]
if DEFAULT_BACKEND != "cpu":
    GPU_DEVICE = devices("gpu")[0]
    config.update("jax_platform_name", "gpu")
else:
    GPU_DEVICE = devices("cpu")[0]
    config.update("jax_platform_name", "cpu")

import jax.numpy as jnp
from jax import jit, vmap
from jax import devices, device_put
from jax import tree_util
from jax.lax import stop_gradient, dynamic_slice

from quantammsim.pools.G3M.quantamm.momentum_pool import (
    MomentumPool,
    _jax_momentum_weight_update,
)
from quantammsim.core_simulator.param_utils import (
    memory_days_to_lamb,
    lamb_to_memory_days_clipped,
    calc_lamb,
    inverse_squareplus_np,
    get_raw_value,
    get_log_amplitude,
    logistic_func,
)
from quantammsim.pools.G3M.quantamm.update_rule_estimators.estimators import (
    calc_triple_threat_gradients,
    calc_k,
    squareplus,
)

from typing import Dict, Any, Optional
from functools import partial
import numpy as np

# import the fine weight output function which has pre-set argument rule_outputs_are_themselves_weights
# as this is False for momentum pools --- the strategy outputs weight _changes_
from quantammsim.pools.G3M.quantamm.weight_calculations.fine_weights import (
    calc_fine_weight_output_from_weight_changes,
)


@jit
def _jax_triple_threat_mean_reversion_channel_weight_update(
    price_gradient_channel,
    price_gradient_trend,
    price_gradient_envelope,
    k,
    width,
    amplitude,
    exponents,
    inverse_scaling=0.5415,
    pre_exp_scaling=0.5,
):
    """
    Compute weight updates for the triple-threat mean-reversion-channel rule.

    Combines a **channel portion** (mean reversion inside the envelope) with
    a **trend portion** (power-law momentum outside the envelope). The
    Gaussian envelope acts as a soft gate: near-zero gradient activates the
    channel signal; large gradient activates the trend signal.

    Channel math::

        envelope = exp(-g_env^2 / (2 * width^2))
        s_ch     = pi * g_ch / (3 * width)
        channel  = -amplitude * envelope * (s_ch - s_ch^3 / 6) / inverse_scaling

    Trend math::

        trend = (1 - envelope) * sign(g_trend)
                * |g_trend / (2 * pre_exp_scaling)|^exponents

    The final weight update is ``k * (channel + trend)``, with an
    offset subtracted to ensure the updates sum to zero across assets.

    Parameters
    ----------
    price_gradient_channel : jnp.ndarray
        EWMA price gradient used for the channel (mean-reversion) signal.
        Shape ``(T, n_assets)``.
    price_gradient_trend : jnp.ndarray
        EWMA price gradient used for the trend-following signal.
        Shape ``(T, n_assets)``.
    price_gradient_envelope : jnp.ndarray
        EWMA price gradient used to compute the Gaussian envelope.
        Shape ``(T, n_assets)``.
    k : jnp.ndarray
        Per-asset responsiveness scaling factor. Shape ``(n_assets,)``
        or broadcastable.
    width : jnp.ndarray
        Width (standard deviation) of the Gaussian envelope. Controls
        the boundary between mean-reversion and trend regimes.
    amplitude : jnp.ndarray
        Amplitude of the channel (mean-reversion) signal, typically
        scaled by ``memory_days``.
    exponents : jnp.ndarray
        Power-law exponents for the trend portion (passed through
        ``squareplus`` to ensure positivity).
    inverse_scaling : float, optional
        Normalisation constant for the channel portion, by default
        0.5415 (the maximum of ``sin(x)`` approximated by the cubic).
    pre_exp_scaling : float, optional
        Controls the relative contribution of the trend signal.
        Larger values attenuate the trend; smaller values amplify it.
        By default 0.5.

    Returns
    -------
    jnp.ndarray
        Weight updates for each asset at each timestep, summing to zero
        across assets. Shape ``(T, n_assets)``.
    """
    envelope = jnp.exp(-(price_gradient_envelope**2) / (2 * width**2))
    scaled_price_gradient = jnp.pi * price_gradient_channel / (3 * width)

    channel_portion = (
        -amplitude
        * envelope
        * (scaled_price_gradient - (scaled_price_gradient**3) / 6)
        / inverse_scaling
    )

    trend_portion = (
        (1 - envelope)
        * jnp.sign(price_gradient_trend)
        * jnp.power(jnp.abs(price_gradient_trend / (2.0 * pre_exp_scaling)), exponents)
    )
    signal = channel_portion + trend_portion

    offset_constants = -(k * signal).sum(axis=-1, keepdims=True) / (jnp.sum(k))
    weight_updates = k * (signal + offset_constants)
    return weight_updates



[docs]
class TripleThreatMeanReversionChannelPool(MomentumPool):
    """
    QuantAMM pool combining mean-reversion channel and trend-following rules.

    The "triple threat" refers to three interacting signal components:

    1. **Channel-based mean reversion** -- A Gaussian envelope modulates a
       cubic function of the normalised price gradient, producing a signal
       that reverts positions when price is within the channel width.
    2. **Trend component** -- Outside the channel, a power-law scaling of
       the price gradient drives trend-following behaviour.
    3. **Interaction** -- The ``pre_exp_scaling`` parameter controls the
       relative contribution of trend vs. channel; the Gaussian envelope
       naturally cross-fades between the two regimes.

    Each of the three signal components uses its own EWMA timescale
    (controlled by separate ``logit_lamb`` entries), allowing the channel,
    trend, and envelope to operate on different look-back horizons.

    Inherits from ``MomentumPool`` and overrides ``calculate_rule_outputs``
    to apply the triple-threat update rule instead of a pure momentum rule.

    See Also
    --------
    MeanReversionChannelPool : Channel-only (no trend) variant.
    MomentumPool : Pure trend-following base class.
    """


[docs]
    def __init__(self):
        """
        Initialize a new MeanReversionChannelPool instance.

        Parameters
        ----------
        None
        """
        super().__init__()



[docs]
    @partial(jit, static_argnums=(2))
    def calculate_rule_outputs(
        self,
        params: Dict[str, Any],
        run_fingerprint: Dict[str, Any],
        prices: jnp.ndarray,
        additional_oracle_input: Optional[jnp.ndarray] = None,
    ) -> jnp.ndarray:
        """
        Calculate the raw weight outputs based on mean reversion channel signals.

        This method computes the raw weight adjustments for the mean reversion channel strategy. It processes
        the input prices to calculate gradients, which are then used to determine weight updates.

        Parameters
        ----------
        params : Dict[str, Any]
            A dictionary of strategy parameters.
        run_fingerprint : Dict[str, Any]
            A dictionary containing run-specific settings.
        prices : jnp.ndarray
            An array of asset prices over time.
        additional_oracle_input : Optional[jnp.ndarray], optional
            Additional input data, if any.

        Returns
        -------
        jnp.ndarray
            Raw weight outputs representing the suggested weight adjustments.

        Notes
        -----
        The method performs the following steps:
        1. Calculates the memory days based on the lambda parameter.
        2. Computes the 'k' factor which scales the weight updates.
        3. Extracts chunkwise price values from the input prices.
        4. Calculates price gradients using the calc_gradients function.
        5. Applies the mean reversion channel weight update formula to get raw weight outputs.

        The raw weight outputs are not the final weights, but rather the changes
        to be applied to the previous weights. These will be refined in subsequent steps.
        """
        use_pre_exp_scaling = run_fingerprint["use_pre_exp_scaling"]
        if use_pre_exp_scaling and params.get("logit_pre_exp_scaling") is not None:
            logit_pre_exp_scaling = params.get("logit_pre_exp_scaling")
            pre_exp_scaling = logistic_func(logit_pre_exp_scaling)
        elif use_pre_exp_scaling and params.get("raw_pre_exp_scaling") is not None:
            pre_exp_scaling = 2 ** params.get("raw_pre_exp_scaling")
        else:
            pre_exp_scaling = 0.5
        memory_days = lamb_to_memory_days_clipped(
            logistic_func(params["logit_lamb_for_ewma"]),
            run_fingerprint["chunk_period"],
            run_fingerprint["max_memory_days"],
        )
        k = calc_k(params, memory_days)
        chunkwise_price_values = prices[:: run_fingerprint["chunk_period"]]
        gradients_channel = calc_triple_threat_gradients(
            params,
            0,
            chunkwise_price_values,
            run_fingerprint["chunk_period"],
            run_fingerprint["max_memory_days"],
            cap_lamb=True,
        )
        gradients_trend = calc_triple_threat_gradients(
            params,
            1,
            chunkwise_price_values,
            run_fingerprint["chunk_period"],
            run_fingerprint["max_memory_days"],
            cap_lamb=True,
        )
        gradients_envelope = calc_triple_threat_gradients(
            params,
            2,
            chunkwise_price_values,
            run_fingerprint["chunk_period"],
            run_fingerprint["max_memory_days"],
            cap_lamb=True,
        )
        exponents = squareplus(params.get("raw_exponents"))
        amplitude = (2 ** params.get("log_amplitude")) * memory_days
        width = 2 ** params.get("raw_width")
        rule_outputs = _jax_triple_threat_mean_reversion_channel_weight_update(
            gradients_channel,
            gradients_trend,
            gradients_envelope,
            k,
            width,
            amplitude,
            exponents,
            pre_exp_scaling=pre_exp_scaling,
        )

        return rule_outputs



[docs]
    def init_base_parameters(
        self,
        initial_values_dict: Dict[str, Any],
        run_fingerprint: Dict[str, Any],
        n_assets: int,
        n_parameter_sets: int = 1,
        noise: str = "gaussian",
    ) -> Dict[str, Any]:
        """
        Initialize parameters for a power channel pool.

        This method sets up the initial parameters for the power channel pool strategy, including
        weights, memory length (lambda), the update agressiveness (k) and the exponents.


        Parameters
        ----------
        initial_values_dict : Dict[str, Any]
            Dictionary containing initial values for various parameters.
        run_fingerprint : Dict[str, Any]
            Dictionary containing run-specific settings and parameters.
        n_assets : int
            The number of assets in the pool.
        n_parameter_sets : int, optional
            The number of parameter sets to initialize, by default 1.
        noise : str, optional
            The type of noise to apply during initialization, by default "gaussian".

        Returns
        -------
        Dict[str, jnp.array]
            Dictionary containing the initialized parameters for the momentum pool.

        Raises
        ------
        ValueError
            If required initial values are missing or in an incorrect format.

        Notes
        -----
        This method handles the initialization of parameters for initial weights, lambda
        (memory length parameter), the update agressiveness (k), the exponents and the width for each asset and parameter set.
        It processes the initial values to ensure they are in the correct format and applies
        any necessary transformations (e.g., logit transformations for lambda).
        """

        np.random.seed(0)

        # We need to initialise the weights for each parameter set
        # If a vector is provided in the inital values dict, we use
        # that, if only a singleton array is provided we expand it
        # to n_assets and use that vlaue for all assets.
        def process_initial_values(
            initial_values_dict, key, n_assets, n_parameter_sets, force_scalar=False
        ):
            if key in initial_values_dict:
                initial_value = initial_values_dict[key]
                if isinstance(initial_value, (np.ndarray, jnp.ndarray, list)):
                    initial_value = np.array(initial_value)
                    if force_scalar:
                        return np.array([initial_value] * n_parameter_sets)
                    elif initial_value.size == n_assets:
                        return np.array([initial_value] * n_parameter_sets)
                    elif initial_value.size == 1:
                        return np.array([[initial_value] * n_assets] * n_parameter_sets)
                    elif initial_value.shape == (n_parameter_sets, n_assets):
                        return initial_value
                    else:
                        raise ValueError(
                            f"{key} must be a singleton or a vector of length n_assets or a matrix of shape (n_parameter_sets, n_assets)"
                        )
                else:
                    if force_scalar:
                        return np.array([[initial_value]] * n_parameter_sets)
                    else:
                        return np.array([[initial_value] * n_assets] * n_parameter_sets)
            else:
                raise ValueError(f"initial_values_dict must contain {key}")


        initial_weights_logits = process_initial_values(
            initial_values_dict, "initial_weights_logits", n_assets, n_parameter_sets, force_scalar=False
        )
        log_k = np.log2(
            process_initial_values(
                initial_values_dict, "initial_k_per_day", n_assets, n_parameter_sets, force_scalar=run_fingerprint["optimisation_settings"]["force_scalar"]
            )
        )

        initial_lamb = memory_days_to_lamb(
            initial_values_dict["initial_memory_length"],
            run_fingerprint["chunk_period"],
        )

        logit_lamb_np = np.log(initial_lamb / (1.0 - initial_lamb))
        if run_fingerprint["optimisation_settings"]["force_scalar"]:
            logit_lamb = np.array([[[logit_lamb_np]] * 3] * n_parameter_sets)
        else:
            logit_lamb = np.array([[[logit_lamb_np] * n_assets] * 3] * n_parameter_sets)

        # lamb delta is the difference in lamb needed for
        # lamb + delta lamb to give a final memory length
        # of  initial_memory_length + initial_memory_length_delta
        initial_lamb_for_ewma = memory_days_to_lamb(
            initial_values_dict["initial_memory_length"],
            run_fingerprint["chunk_period"],
        )

        logit_lamb_for_ewma_np = np.log(
            initial_lamb_for_ewma / (1.0 - initial_lamb_for_ewma)
        )
        if run_fingerprint["optimisation_settings"]["force_scalar"]:
            logit_lamb_for_ewma = np.array([[logit_lamb_for_ewma_np]] * n_parameter_sets)
        else:
            logit_lamb_for_ewma = np.array(
                [[logit_lamb_for_ewma_np] * n_assets] * n_parameter_sets
            )

        raw_pre_exp_scaling_np = np.log2(
            initial_values_dict["initial_pre_exp_scaling"]
        )
        if run_fingerprint["optimisation_settings"]["force_scalar"]:
            raw_pre_exp_scaling = np.array([[raw_pre_exp_scaling_np]] * n_parameter_sets)
        else:
            raw_pre_exp_scaling = np.array(
                [[raw_pre_exp_scaling_np] * n_assets] * n_parameter_sets
            )

        if run_fingerprint["optimisation_settings"]["force_scalar"]:
            log_amplitude = np.array([[initial_values_dict["initial_log_amplitude"]]] * n_parameter_sets)
        else:
            log_amplitude = np.array(
                [[initial_values_dict["initial_log_amplitude"]] * n_assets]
                * n_parameter_sets
            )

        if run_fingerprint["optimisation_settings"]["force_scalar"]:
            raw_width = np.array([[initial_values_dict["initial_raw_width"]]] * n_parameter_sets)
        else:
            raw_width = np.array(
                [[initial_values_dict["initial_raw_width"]] * n_assets] * n_parameter_sets
            )

        if run_fingerprint["optimisation_settings"]["force_scalar"]:
            raw_exponents = np.array([[initial_values_dict["initial_raw_exponents"]]] * n_parameter_sets)
        else:
            raw_exponents = np.array(
                [[initial_values_dict["initial_raw_exponents"]] * n_assets]
                * n_parameter_sets
            )
        params = {
            "log_k": log_k,
            "logit_lamb": logit_lamb,
            "logit_lamb_for_ewma": logit_lamb_for_ewma,
            "initial_weights_logits": initial_weights_logits,
            "log_amplitude": log_amplitude,
            "raw_width": raw_width,
            "raw_exponents": raw_exponents,
            "raw_pre_exp_scaling": raw_pre_exp_scaling,
            "subsidary_params": [],
        }

        params = self.add_noise(params, noise, n_parameter_sets)
        return params


    @classmethod
    def _process_specific_parameters(cls, update_rule_parameters, run_fingerprint):
        """Process mean reversion channel specific parameters."""
        result = {}
        amplitude_values = None
        memory_days = None

        # Get memory_days value for amplitude calculation
        for urp in update_rule_parameters:
            if urp.name == "memory_days":
                memory_days = urp.value
                break

        # Process specific parameters
        for urp in update_rule_parameters:
            if urp.name == "amplitude":
                amplitude_values = urp.value
            elif urp.name == "exponent":
                raw_exponents = [float(inverse_squareplus_np(val)) for val in urp.value]
                if len(raw_exponents) != len(run_fingerprint["tokens"]):
                    raw_exponents = [raw_exponents[0]] * len(run_fingerprint["tokens"])
                result["raw_exponents"] = np.array(raw_exponents)
            elif urp.name == "width":
                raw_width = [float(get_raw_value(val)) for val in urp.value]
                result["raw_width"] = np.array(raw_width)
                if len(raw_width) != len(run_fingerprint["tokens"]):
                    raw_width = [raw_width[0]] * len(run_fingerprint["tokens"])
                result["raw_width"] = np.array(raw_width)
            elif urp.name == "pre_exp_scaling":
                raw_pre_exp_scaling = [float(get_raw_value(val)) for val in urp.value]
                if len(raw_pre_exp_scaling) != len(run_fingerprint["tokens"]):
                    raw_pre_exp_scaling = [raw_pre_exp_scaling[0]] * len(run_fingerprint["tokens"])
                result["raw_pre_exp_scaling"] = np.array(raw_pre_exp_scaling)

        # Process amplitude last
        if amplitude_values is not None:
            if memory_days is None:
                raise ValueError("memory_days parameter is required for amplitude calculation")
            log_amplitude = [
                get_log_amplitude(float(amp), float(mem)) 
                for amp, mem in zip(amplitude_values, memory_days)
            ]
            if len(log_amplitude) != len(run_fingerprint["tokens"]):
                log_amplitude = [log_amplitude[0]] * len(run_fingerprint["tokens"])
            result["log_amplitude"] = np.array(log_amplitude)
        return result


tree_util.register_pytree_node(
    TripleThreatMeanReversionChannelPool,
    TripleThreatMeanReversionChannelPool._tree_flatten,
    TripleThreatMeanReversionChannelPool._tree_unflatten,
)