Source code for tstrends.trend_labelling.oracle_labeller

from typing import overload, Literal

try:
    from typing import override  # Python 3.12+
except ImportError:  # pragma: no cover - fallback for older Python
    from typing_extensions import override

import numpy as np
from numpy.typing import NDArray

from .base_labeller import BaseLabeller
from .label_scaling import Labels, scale_binary, scale_ternary



[docs]
class BaseOracleTrendLabeller(BaseLabeller):
    """Base class for Oracle Trend Labellers.

    This class implements the core functionality of the Oracle Trend Labelling algorithm,
    which uses dynamic programming to find optimal trend labels by maximizing returns
    while considering transaction costs.

    The algorithm works in three main steps:
        1. Compute transition costs between states
        2. Forward pass to calculate cumulative returns
        3. Backward pass to determine optimal labels

    Attributes:
        transaction_cost (float): Cost coefficient for making a transaction between states.

    Note:
        This is an abstract base class. Concrete implementations must provide
        the _scale_labels method to define how raw labels are scaled to the
        final output format.
    """

    transaction_cost: float


[docs]
    def __init__(self, transaction_cost: float) -> None:
        """
        Initialize the base Oracle Trend Labeller.

        Args:
            transaction_cost (float): Cost of making a transaction
        """
        if not isinstance(transaction_cost, float):
            raise TypeError("transaction_cost must be a float.")
        self.transaction_cost = transaction_cost


    def _scale_labels(self, labels: NDArray[np.int_]) -> NDArray[np.int_]:
        """
        Scale the labels.
        """
        raise NotImplementedError("Subclasses must implement this method.")

    def _verify_time_series(self, time_series_list: list[float]) -> None:
        """
        Verify the input time series.
        Args:
            time_series_list (list[float]): The price series.
        """
        if not isinstance(time_series_list, list):
            raise TypeError("time_series_list must be a list.")
        if not all(isinstance(price, (int, float)) for price in time_series_list):
            raise TypeError(
                "All elements in time_series_list must be integers or floats."
            )
        if len(time_series_list) < 2:
            raise ValueError("time_series_list must contain at least two elements.")

    def _compute_transition_costs(
        self, time_series_list: NDArray[np.float64]
    ) -> NDArray[np.float64]:
        """
        Compute the transition costs.
        """
        raise NotImplementedError("Subclasses must implement this method.")

    def _forward_pass(
        self, time_series_list: NDArray[np.float64], P: NDArray[np.float64]
    ) -> NDArray[np.float64]:
        """
        Perform the forward pass to calculate the state matrix.
        """
        raise NotImplementedError("Subclasses must implement this method.")

    def _backward_pass(
        self,
        S: NDArray[np.float64],
        P: NDArray[np.float64],
        time_series_arr: NDArray[np.float64],
    ) -> NDArray[np.int_]:
        """
        Perform the backward pass to determine the trend labels.
        Args:
            S (NDArray[np.float64]): State matrix of cumulative returns.
            P (NDArray[np.float64]): Transition cost matrix.
        Returns:
            labels (NDArray[np.int_]): Optimal trend labels.
        """
        T = len(time_series_arr)
        labels = np.zeros(T, dtype=int)
        last_row = np.asarray(S[-1], dtype=np.float64)
        labels[-1] = int(np.argmax(last_row))  # Start from the last state

        for t in range(T - 2, -1, -1):
            row = np.asarray(S[t] + P[t, :, labels[t + 1]], dtype=np.float64)
            labels[t] = int(np.argmax(row))

        return labels

    @overload
    def get_labels(
        self, time_series_list: list[float], return_labels_as_int: Literal[True] = True
    ) -> list[int]: ...

    @overload
    def get_labels(
        self, time_series_list: list[float], return_labels_as_int: Literal[False]
    ) -> list[Labels]: ...


[docs]
    @override
    def get_labels(
        self, time_series_list: list[float], return_labels_as_int: bool = True
    ) -> list[int] | list[Labels]:
        """
        Run the full Oracle Trend Labeling Algorithm over a time series.

        Args:
            time_series_list (list[float]): The price series.
            return_labels_as_int (bool, optional): If True, returns integer labels (-1, 0, 1),
                                                  if False returns Labels enum values. Defaults to True.

        Returns:
            Union[list[int], list[Labels]]: Optimal trend labels. If return_labels_as_int is True, returns scaled integers,
                                          otherwise returns Labels enum values.
        """
        self._verify_time_series(time_series_list)
        time_series_arr = np.array(time_series_list, dtype=np.float64)

        P = self._compute_transition_costs(time_series_arr)
        S = self._forward_pass(time_series_arr, P)
        labels = self._backward_pass(S, P, time_series_arr)

        scaled_labels = self._scale_labels(labels)
        ints = [int(x) for x in scaled_labels.tolist()]
        if return_labels_as_int:
            return ints
        return [Labels(v) for v in ints]





[docs]
class OracleBinaryTrendLabeller(BaseOracleTrendLabeller):
    """Oracle Binary Trend Labeller.

    This class implements a binary version of the Oracle Trend Labelling algorithm,
    adapted from the paper by T. Kovačević, A. Merćep, S. Begušić and Z. Kostanjčar,
    "Optimal Trend Labeling in Financial Time Series".

    The algorithm identifies two distinct states:
        - Upward trends (label: Labels.UP or 1)
        - Downward trends (label: Labels.DOWN or -1)

    Attributes:
        transaction_cost (float): Inherited from BaseOracleTrendLabeller.

    Example:
        >>> labeller = OracleBinaryTrendLabeller(transaction_cost=0.001)
        >>> prices = [1.0, 1.15, 1.2, 1.0]
        >>> labels = labeller.get_labels(prices)
        >>> print(labels)  # [-1, 1, 1, -1]

    Note:
        The transaction cost parameter influences how readily the algorithm
        switches between trends. Higher costs result in more stable trend
        assignments.
    """


[docs]
    def __init__(self, transaction_cost: float) -> None:
        """
        Initialize the binary trend labeller.
        """
        super().__init__(transaction_cost)


    @override
    def _scale_labels(self, labels: NDArray[np.int_]) -> NDArray[np.int_]:
        """
        Scale the labels.
        """
        return scale_binary(labels)

    @override
    def _compute_transition_costs(
        self, time_series_list: NDArray[np.float64]
    ) -> NDArray[np.float64]:
        """
        Initialize the transition cost matrix.
        Args:
            time_series_list (NDArray[np.float64]): Array of price values.
        Returns:
            P (NDArray[np.float64]): Transition cost matrix of shape (T-1, 2, 2).
        """
        ts_len = len(time_series_list)

        P = np.zeros((ts_len - 1, 2, 2), dtype=np.float64)

        for t in range(ts_len - 1):
            price_change: float = time_series_list[t + 1] - time_series_list[t]
            # Staying in the same state
            P[t, 0, 0] = 0  # No cost for staying in downtrend
            P[t, 1, 1] = price_change  # Cost for staying in uptrend

            # Switching states
            P[t, 0, 1] = (
                -time_series_list[t] * self.transaction_cost
            )  # Downtrend to uptrend
            P[t, 1, 0] = (
                -time_series_list[t] * self.transaction_cost
            )  # Uptrend to downtrend

        return P

    @override
    def _forward_pass(
        self,
        time_series_list: list[float] | NDArray[np.float64],
        P: NDArray[np.float64],
    ) -> NDArray[np.float64]:
        """
        Perform the forward pass to calculate the state matrix.
        Args:
            P (NDArray[np.float64]): Transition cost matrix.
        Returns:
            S (NDArray[np.float64]): State matrix of cumulative returns.
        """
        S = np.zeros(
            (len(time_series_list), 2), dtype=np.float64
        )  # Initialize state matrix

        # Iterate over time steps in forward direction
        for t in range(1, len(time_series_list)):
            S[t, 0] = max(S[t - 1, 0] + P[t - 1, 0, 0], S[t - 1, 1] + P[t - 1, 1, 0])
            S[t, 1] = max(S[t - 1, 0] + P[t - 1, 0, 1], S[t - 1, 1] + P[t - 1, 1, 1])

        return S




[docs]
class OracleTernaryTrendLabeller(BaseOracleTrendLabeller):
    """Oracle Ternary Trend Labeller.

    This class implements an adaptation of the Oracle Trend Labelling algorithm
    to a three-state setting with dynamic programming. This consists is two main ideas,
    managing the general behaviour through the neutral state:
    1. Transitions between downtrend and uptrend must go through the neutral state.
    2. The reward for staying in the neutral state is calculated differently than
        the reward for staying in a downtrend or uptrend.

    The algorithm identifies three states:
        - Upward trends (label: Labels.UP or 1)
        - Neutral trends (label: Labels.NEUTRAL or 0)
        - Downward trends (label: Labels.DOWN or -1)

    Attributes:
        transaction_cost (float): Inherited from BaseOracleTrendLabeller.
        neutral_reward_factor (float): Coefficient for tuning the reward for staying in the neutral state.
        Lower values ease the switch into downtrends and uptrends.

    Example:
        >>> labeller = OracleTernaryTrendLabeller(transaction_cost=0.001, neutral_reward_factor=0.5)
        >>> prices = [1.0, 1.15, 1.2, 1.18, 1.0]
        >>> labels = labeller.get_labels(prices)
        >>> print(labels)  # [-1, 1, 1, 0, -1]

    Note:
        The neutral_reward_factor parameter influences how the algorithm weights price changes
        in the neutral state. The neutral_reward_factor is usually best set lower than 1.0,
        tuned up together with the transaction_cost.
    """

    neutral_reward_factor: float


[docs]
    def __init__(self, transaction_cost: float, neutral_reward_factor: float) -> None:
        """
        Initialize the ternary trend labeller.

        Args:
            transaction_cost (float): Cost coefficient for switching between trends.
            neutral_reward_factor (float): Trend coefficient for weighting price changes.
        """
        super().__init__(transaction_cost)
        if not isinstance(neutral_reward_factor, float):
            raise TypeError("neutral_reward_factor must be a float.")
        self.neutral_reward_factor = neutral_reward_factor


    @override
    def _scale_labels(self, labels: NDArray[np.int_]) -> NDArray[np.int_]:
        """
        Scale the labels.
        """
        return scale_ternary(labels)

    @override
    def _compute_transition_costs(
        self, time_series_list: NDArray[np.float64]
    ) -> NDArray[np.float64]:
        """
        Initialize the transition cost matrix for three states.

        Args:
            time_series_list (NDArray[np.float64]): Array of price values.
        Returns:
            NDArray[np.float64]: Transition cost matrix of shape (T-1, 3, 3).
        """
        T = len(time_series_list)
        P = np.full(
            (T - 1, 3, 3), -np.inf, dtype=np.float64
        )  # Initialize with -inf for forbidden transitions

        for t in range(T - 1):
            price_change: float = time_series_list[t + 1] - time_series_list[t]
            switch_cost: float = -time_series_list[t] * self.transaction_cost

            # Rewards for staying in same state
            P[t, 0, 0] = -price_change  # Reward for staying in downtrend
            P[t, 1, 1] = (
                abs(price_change) * self.neutral_reward_factor
            )  # No reward for staying neutral
            P[t, 2, 2] = price_change  # Reward for staying in uptrend

            # Rewards for allowed transitions
            P[t, 0, 1] = switch_cost  # Downtrend to neutral
            P[t, 1, 0] = switch_cost  # Neutral to downtrend
            P[t, 1, 2] = switch_cost  # Neutral to uptrend
            P[t, 2, 1] = switch_cost  # Uptrend to neutral

        return P

    @override
    def _forward_pass(
        self,
        time_series_list: list[float] | NDArray[np.float64],
        P: NDArray[np.float64],
    ) -> NDArray[np.float64]:
        """
        Perform the forward pass to calculate the state matrix.

        Args:
            time_series_list (list[float]): The price series.
            P (NDArray[np.float64]): Transition cost matrix.

        Returns:
            NDArray[np.float64]: State matrix of cumulative returns.
        """
        T = len(time_series_list)
        S = np.zeros((T, 3), dtype=np.float64)  # Initialize state matrix for 3 states

        # Iterate over time steps in forward direction
        for t in range(1, T):
            # Maximum return for being in downtrend
            S[t, 0] = max(
                S[t - 1, 0] + P[t - 1, 0, 0],  # Stay in downtrend
                S[t - 1, 1] + P[t - 1, 1, 0],  # Switch from neutral
            )

            # Maximum return for being in neutral
            S[t, 1] = max(
                S[t - 1, 0] + P[t - 1, 0, 1],  # Switch from downtrend
                S[t - 1, 1] + P[t - 1, 1, 1],  # Stay in neutral
                S[t - 1, 2] + P[t - 1, 2, 1],  # Switch from uptrend
            )

            # Maximum return for being in uptrend
            S[t, 2] = max(
                S[t - 1, 1] + P[t - 1, 1, 2],  # Switch from neutral
                S[t - 1, 2] + P[t - 1, 2, 2],  # Stay in uptrend
            )

        return S