Source code for vangja.time_series

"""Time series model classes for vangja.

This module provides the core time series modeling classes that support
additive and multiplicative composition of model components.

Classes
-------
TimeSeriesModel
    Base class for all time series model components.
AdditiveTimeSeries
    Combination of two components using addition.
MultiplicativeTimeSeries
    Combination of two components using y = left * (1 + right).
SimpleMultiplicativeTimeSeries
    Combination of two components using y = left * right.
CombinedTimeSeries
    Base class for combined time series models.
"""

import arviz as az
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import pymc as pm
import pymc_extras as pmx

from vangja.types import (
    FreqStr,
    Method,
    NutsSampler,
    OptimizationMethod,
    PoolType,
    ScaleMode,
    Scaler,
    TScaleParams,
    YScaleParams,
)
from vangja.utils import get_group_definition


class TimeSeriesModel:
    """Base class for time series model components.

    This class provides the foundation for building time series models in
    vangja. It handles data preprocessing, scaling, model fitting, and
    prediction. Model components can be combined using arithmetic operators
    (+, *, **) to create complex models.

    Attributes
    ----------
    data : pd.DataFrame
        The processed training data after fitting.
    y_scale_params : YScaleParams | dict[int, YScaleParams]
        Scaling parameters for the target variable y. Either a single dict
        for complete scaling or a dict of dicts for individual scaling.
    t_scale_params : TScaleParams
        Scaling parameters for the time variable t.
    group : np.ndarray
        Array of group codes for each data point.
    n_groups : int
        Number of unique groups/series in the data.
    groups_ : dict[int, str]
        Mapping from group codes to series names.
    model : pm.Model
        The PyMC model after fitting.
    model_idxs : dict[str, int]
        Counter for component indices by type.
    samples : int
        Number of posterior samples (for MCMC/VI methods).
    method : Method
        The inference method used for fitting.
    initvals : dict[str, float]
        Initial values for model parameters.
    map_approx : dict[str, np.ndarray] | None
        MAP parameter estimates (if using MAP inference).
    trace : az.InferenceData | None
        Posterior samples (if using MCMC/VI inference).

    Examples
    --------
    >>> from vangja import LinearTrend, FourierSeasonality
    >>> # Create an additive model
    >>> model = LinearTrend() + FourierSeasonality(period=365.25, series_order=10)
    >>> model.fit(data)
    >>> predictions = model.predict(horizon=30)
    >>> # Create a multiplicative model
    >>> model = LinearTrend() ** FourierSeasonality(period=7, series_order=3)
    >>> model.fit(data)

    Notes
    -----
    Subclasses should implement:

    - `definition`: Add parameters to the PyMC model
    - `_get_initval`: Provide initial values for parameters
    - `_predict_map`: Predict using MAP estimates
    - `_predict_mcmc`: Predict using MCMC samples
    - `_plot`: Plot the component's contribution
    """

    data: pd.DataFrame
    y_scale_params: YScaleParams | dict[int, YScaleParams]
    t_scale_params: TScaleParams
    group: np.ndarray
    n_groups: int
    groups_: dict[int, str]
    model: pm.Model
    model_idxs: dict[str, int]
    samples: int
    method: Method
    initvals: dict[str, float]
    map_approx: dict[str, np.ndarray] | None
    trace: az.InferenceData | None
    _predict_columns: dict[str, np.ndarray]

    def _get_leaf_components(self) -> list["TimeSeriesModel"]:
        """Return leaf components of the model tree.

        For a leaf component, returns itself. Combined models override this
        to recursively collect from children.

        Returns
        -------
        list[TimeSeriesModel]
            List of leaf components.
        """
        return [self]

    def _collect_predict_columns(self) -> dict[str, np.ndarray]:
        """Collect all pending prediction columns from leaf components.

        Gathers ``_predict_columns`` dicts stored by each leaf component
        during ``_predict_map`` / ``_predict_mcmc`` and merges them.

        Returns
        -------
        dict[str, np.ndarray]
            Merged mapping of column names to value arrays.
        """
        all_cols: dict[str, np.ndarray] = {}
        for leaf in self._get_leaf_components():
            all_cols.update(getattr(leaf, "_predict_columns", {}))
        return all_cols

    def _get_scale_params(
        self, series: pd.DataFrame, scaler: Scaler, t_scale_params: TScaleParams | None
    ) -> tuple[TScaleParams, YScaleParams]:
        return (
            (
                t_scale_params
                if t_scale_params is not None
                else {
                    "ds_min": series["ds"].min(),
                    "ds_max": series["ds"].max(),
                }
            ),
            {
                "scaler": scaler,
                "y_min": 0 if scaler == "maxabs" else series["y"].min(),
                "y_max": (
                    series["y"].abs().max()
                    if scaler == "maxabs"
                    else series["y"].max()
                ),
            },
        )

    def _process_data(
        self,
        data: pd.DataFrame,
        scaler: Scaler,
        scale_mode: ScaleMode,
        t_scale_params: TScaleParams | None,
    ) -> None:
        """Convert the dataframe to the correct format and scale dates and values.

        Parameters
        ----------
        data : pd.DataFrame
            A pandas dataframe that must at least have columns ds (predictor)
            and y (target). Column series (name of time series) is optional.
        scaler : Scaler
            Whether to use maxabs or minmax scaling of the y (target).
        scale_mode : ScaleMode
            Whether to scale each series individually or together.
        t_scale_params : TScaleParams | None
            Optional override of the scale parameters for ds (predictor).
        """
        self.data = data.reset_index(drop=True).dropna()
        self.data["ds"] = pd.to_datetime(self.data["ds"])
        self.data["t"] = 0.0
        self.data["y"] = self.data["y"].astype(float)
        if "series" not in self.data.columns:
            self.data["series"] = "series"

        self.data.sort_values("ds", inplace=True)
        self.group, self.n_groups, self.groups_ = get_group_definition(
            self.data, "partial"
        )

        if scale_mode == "individual":
            self.t_scale_params, _ = self._get_scale_params(
                self.data, scaler, t_scale_params
            )
            self.y_scale_params = {}
            for group_code, group_name in self.groups_.items():
                _, y_params = self._get_scale_params(
                    self.data[self.data["series"] == group_name], scaler, t_scale_params
                )
                self.data.loc[self.data["series"] == group_name, "t"] = (
                    self.data.loc[self.data["series"] == group_name, "ds"]
                    - self.t_scale_params["ds_min"]
                ) / (self.t_scale_params["ds_max"] - self.t_scale_params["ds_min"])
                self.data.loc[self.data["series"] == group_name, "y"] = (
                    self.data.loc[self.data["series"] == group_name, "y"]
                    - y_params["y_min"]
                ) / (y_params["y_max"] - y_params["y_min"])
                self.y_scale_params[group_code] = y_params

            return

        self.t_scale_params, self.y_scale_params = self._get_scale_params(
            self.data, scaler, t_scale_params
        )
        self.data["t"] = (self.data["ds"] - self.t_scale_params["ds_min"]) / (
            self.t_scale_params["ds_max"] - self.t_scale_params["ds_min"]
        )
        self.data["y"] = (self.data["y"] - self.y_scale_params["y_min"]) / (
            self.y_scale_params["y_max"] - self.y_scale_params["y_min"]
        )

    def _get_model_initvals(self) -> dict[str, float]:
        """Calculate initvals based on data."""
        initvals: dict[str, float] = {"sigma": 1.0}
        for key in self.groups_.keys():
            series: pd.DataFrame = self.data[self.group == key]
            i0, i1 = series["ds"].idxmin(), series["ds"].idxmax()
            T = series["t"].loc[i1] - series["t"].loc[i0]
            slope = (series["y"].loc[i1] - series["y"].loc[i0]) / T
            intercept = series["y"].loc[i0] - slope * series["t"].loc[i0]
            initvals[f"slope_{key}"] = slope
            initvals[f"intercept_{key}"] = intercept

        return initvals

    def get_initval(self, initvals: dict[str, float], model: pm.Model) -> dict:
        """Get the initval of the standard deviation of the Normal prior of y (target).

        Parameters
        ----------
        initvals : dict[str, float]
            Calculated initvals based on data.
        model : pm.Model
            The model for which the initvals will be set.
        """
        sigma_var = model.named_vars["sigma"]
        sigma_val = initvals.get("sigma", 1)
        sigma_initvals = {}
        # Only set initvals for sigma if it's a free RV (skip Deterministic
        # sigma from partial pooling, which is determined by its parents)
        if sigma_var in model.free_RVs:
            # For individual pooling, sigma has shape (n_groups,); broadcast
            # the scalar initval to match the variable shape
            if sigma_var.type.ndim > 0:
                sigma_initvals[sigma_var] = np.ones(self.n_groups) * sigma_val
            else:
                sigma_initvals[sigma_var] = sigma_val

        return {
            **sigma_initvals,
            **self._get_initval(initvals, model),
        }

    def fit(
        self,
        data: pd.DataFrame,
        scaler: Scaler = "maxabs",
        scale_mode: ScaleMode = "complete",
        t_scale_params: TScaleParams | None = None,
        sigma_sd: float = 0.5,
        sigma_pool_type: PoolType = "complete",
        sigma_shrinkage_strength: float = 1,
        method: Method = "mapx",
        optimization_method: OptimizationMethod = "L-BFGS-B",
        maxiter: int = 10000,
        n: int = 10000,
        samples: int = 1000,
        chains: int = 4,
        cores: int = 4,
        nuts_sampler: NutsSampler = "pymc",
        progressbar: bool = True,
        idata: az.InferenceData | None = None,
    ):
        """Create and fit the model to the data.

        Parameters
        ----------
        data : pd.DataFrame
            A pandas dataframe that must at least have columns ds (predictor),
            y (target) and series (name of time series).
        scaler : Scaler
            Whether to use maxabs or minmax scaling of the y (target).
        scale_mode : ScaleMode
            Whether to scale each series individually or together.
        t_scale_params : TScaleParams | None
            Optional override of the scale parameters for ds (predictor).
        sigma_sd : float
            The standard deviation of the Normal prior of y (target).
        sigma_pool_type : PoolType
            Type of pooling for the sigma parameter that is performed when
            sampling.
        sigma_shrinkage_strength : float
            Shrinkage between groups for the hierarchical modeling.
        method : Method
            The Bayesian inference method to be used. Either a point estimate
            (MAP), a VI method (ADVI etc.) or full Bayesian sampling (MCMC).
        optimization_method : OptimizationMethod
            The optimization method to be used for MAP inference. See the
            scipy.optimize.minimize documentation for details.
        maxiter : int
            The maximum number of iterations for the L-BFGS-B optimization
            algorithm when using MAP inference.
        n : int
            The number of iterations to be used for the VI methods.
        samples : int
            The number of samples to be drawn from the posterior for MCMC
            and VI methods.
        chains : int
            The number of independent chains drawn from the posterior. Only
            applicable to the MCMC methods.
        cores : int
            The number of cores used to draw chains in parallel. Only
            applicable to the MCMC methods.
        nuts_sampler : NutsSampler
            The sampler for the NUTS method.
        progressbar : bool
            Whether to show a progressbar while fitting the model.
        idata : az.InferenceData | None
            Samples from a posterior. If it is not None, Vangja will use
            them to set the parameters' priors in the model. In that case,
            each component of the model should specify how idata should be
            used to set its parameters' priors.
        """
        self._process_data(data, scaler, scale_mode, t_scale_params)
        self.model = pm.Model()
        self.model_idxs = {}
        self.samples = samples
        self.method = method

        with self.model:
            priors = None
            if idata is not None and self.needs_priors():
                # Pre-assign model indices so components can declare
                # which posterior variables they need for transfer learning.
                pre_idxs: dict[str, int] = {}
                self._assign_model_idx(pre_idxs)
                needed_vars = self._get_prior_var_names()
                # Only include variables that actually exist in the posterior
                available = set(idata["posterior"].data_vars)
                prior_vars = {
                    var: f"prior_{var}" for var in needed_vars if var in available
                }
                if prior_vars:
                    priors = pmx.utils.prior.prior_from_idata(
                        idata,
                        name="priors",
                        **prior_vars,
                    )

            mu = self.definition(self.model, self.data, self.model_idxs, priors, idata)
            if sigma_pool_type == "partial":
                sigma_sigma = pm.HalfCauchy(
                    "sigma_sigma", sigma_sd / sigma_shrinkage_strength
                )
                sigma_offset = pm.HalfNormal("sigma_offset", 1, shape=self.n_groups)
                sigma = pm.Deterministic("sigma", sigma_offset * sigma_sigma)
                _ = pm.Normal(
                    "obs", mu=mu, sigma=sigma[self.group], observed=self.data["y"]
                )
            elif sigma_pool_type == "individual":
                sigma = pm.HalfNormal("sigma", sigma_sd, shape=self.n_groups)
                _ = pm.Normal(
                    "obs", mu=mu, sigma=sigma[self.group], observed=self.data["y"]
                )
            else:
                sigma = pm.HalfNormal("sigma", sigma_sd)
                _ = pm.Normal("obs", mu=mu, sigma=sigma, observed=self.data["y"])

        self.map_approx = None
        self.trace = None
        self.initvals = self._get_model_initvals()
        initval_dict = self.get_initval(self.initvals, self.model)

        with self.model:
            if self.method == "mapx":
                map_result = pmx.find_MAP(
                    method=optimization_method,
                    use_grad=True,
                    initvals=initval_dict,
                    progressbar=progressbar,
                    gradient_backend="jax",
                    compile_kwargs={"mode": "JAX"},
                    options={"maxiter": maxiter},
                )
                # Convert InferenceData to dict format for consistent access
                self.map_approx = {
                    var: map_result.posterior[var].values.squeeze()
                    for var in map_result.posterior.data_vars
                }
            elif self.method == "map":
                self.map_approx = pm.find_MAP(
                    start=initval_dict,
                    method=optimization_method,
                    progressbar=progressbar,
                    maxeval=maxiter,
                )
            elif self.method in ["fullrank_advi", "advi", "svgd", "asvgd"]:
                approx = pm.fit(
                    n,
                    method=self.method,
                    start=initval_dict if self.method != "asvgd" else None,
                    progressbar=progressbar,
                )
                self.trace = approx.sample(draws=self.samples)
            elif self.method in ["nuts", "metropolis", "demetropolisz"]:
                step = pm.NUTS()
                if self.method == "metropolis":
                    step = pm.Metropolis()
                if self.method == "demetropolisz":
                    step = pm.DEMetropolisZ()

                self.trace = pm.sample(
                    self.samples,
                    chains=chains,
                    cores=cores,
                    nuts_sampler=nuts_sampler,
                    initvals=initval_dict,
                    step=step,
                    progressbar=progressbar,
                )
            else:
                raise NotImplementedError(
                    f"Method {self.method} is not supported at the moment!"
                )

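    # Usage sketch (hypothetical ``df`` with ds/y columns; component names
    # follow the class docstring examples):
    #
    # >>> model = LinearTrend() + FourierSeasonality(period=365.25, series_order=10)
    # >>> model.fit(df, method="mapx")               # fast point estimate
    # >>> model.fit(df, method="nuts", samples=500)  # full MCMC posterior
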
    def _make_future_df(self, horizon: int, freq: FreqStr = "D"):
        """Create a dataframe for inference.

        Parameters
        ----------
        horizon : int
            The number of steps in the future that we are forecasting.
        freq : FreqStr
            The distance between the forecasting steps.
        """
        future = pd.DataFrame(
            {
                "ds": pd.DatetimeIndex(
                    np.hstack(
                        (
                            pd.date_range(
                                self.t_scale_params["ds_min"],
                                self.t_scale_params["ds_max"],
                                freq="D",
                            ).to_numpy(),
                            pd.date_range(
                                self.t_scale_params["ds_max"],
                                self.t_scale_params["ds_max"]
                                + pd.Timedelta(horizon, freq),
                                inclusive="right",
                            ).to_numpy(),
                        )
                    )
                )
            }
        )
        future["t"] = (future["ds"] - self.t_scale_params["ds_min"]) / (
            self.t_scale_params["ds_max"] - self.t_scale_params["ds_min"]
        )
        return future

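    # Sketch of the resulting time axis: the frame spans the daily training
    # range plus ``horizon`` steps at ``freq``, and ``t`` maps the training
    # window onto [0, 1], so forecast rows have t > 1:
    #
    # >>> future = model._make_future_df(horizon=30)  # hypothetical fitted model
    # >>> bool(future["t"].iloc[-1] > 1.0)
    # True
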
    def predict(self, horizon: int, freq: FreqStr = "D"):
        """Perform out-of-sample inference.

        Parameters
        ----------
        horizon : int
            The number of steps in the future that we are forecasting.
        freq : FreqStr
            The distance between the forecasting steps.
        """
        future = self._make_future_df(horizon, freq)
        forecasts = self._predict(future, self.method, self.map_approx, self.trace)
        # TODO come up with a better way to check this
        is_individual = "scaler" not in self.y_scale_params

        # Collect component columns set during _predict
        new_cols = self._collect_predict_columns()

        for group_code in range(forecasts.shape[0]):
            y_min, y_max = self._get_y_bounds(group_code, is_individual)
            scale = y_max - y_min
            new_cols[f"yhat_{group_code}"] = forecasts[group_code] * scale + y_min
            for model_type, model_cnt in self.model_idxs.items():
                if not model_type.startswith("lt"):
                    continue

                for model_idx in range(model_cnt):
                    component = f"{model_type}_{model_idx}_{group_code}"
                    if component in new_cols:
                        new_cols[component] = new_cols[component] * scale + y_min

        return pd.concat([future, pd.DataFrame(new_cols, index=future.index)], axis=1)

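    # Output sketch: one rescaled ``yhat_<group_code>`` column per series
    # (group codes are assigned in _process_data), alongside ds and t:
    #
    # >>> fc = model.predict(horizon=30)
    # >>> fc[["ds", "yhat_0"]].tail()  # point forecast for group 0
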
    def predict_uncertainty(
        self,
        horizon: int,
        freq: FreqStr = "D",
        uncertainty_samples: int = 200,
        interval_width: float = 0.95,
    ) -> pd.DataFrame:
        """Predict with uncertainty intervals.

        For MCMC/VI methods, uncertainty is derived from posterior samples.
        Each posterior draw is propagated through the model to produce a
        family of prediction trajectories, from which percentile-based
        credible intervals are computed.

        For MAP methods, uncertainty is estimated using a hybrid approach:

        1. The fitted observation noise ``sigma`` provides a base noise
           level.
        2. In-sample residuals are used to calibrate the noise estimate.
        3. A forecast-distance scaling factor ``sqrt(1 + h/n)`` widens the
           intervals for predictions further from the training data,
           reflecting increasing epistemic uncertainty.

        Parameters
        ----------
        horizon : int
            Number of future steps to forecast.
        freq : FreqStr, default "D"
            Frequency of forecast steps.
        uncertainty_samples : int, default 200
            Number of posterior draws to use for interval estimation. Only
            used for MCMC/VI methods.
        interval_width : float, default 0.95
            Width of the prediction interval (e.g. 0.95 for a 95% interval).

        Returns
        -------
        pd.DataFrame
            The future DataFrame with columns ``yhat_<group>``,
            ``yhat_lower_<group>``, and ``yhat_upper_<group>`` for each
            group.

        Notes
        -----
        See ``uncertainty.md`` for a detailed description of the approaches.
        """
        future = self._make_future_df(horizon, freq)
        is_individual = "scaler" not in self.y_scale_params

        alpha = 1.0 - interval_width
        lower_q = alpha / 2.0
        upper_q = 1.0 - alpha / 2.0

        # Collect all new columns here, then concat at the end
        new_cols: dict[str, np.ndarray] = {}

        if self.method not in ["mapx", "map"] and self.trace is not None:
            # --- MCMC / VI: propagate posterior draws ---
            posterior = self.trace.posterior
            n_chains = posterior.dims["chain"]
            n_draws = posterior.dims["draw"]
            total_draws = n_chains * n_draws
            n_samples = min(uncertainty_samples, total_draws)

            # Sub-sample draw indices
            rng = np.random.default_rng(42)
            flat_indices = rng.choice(total_draws, size=n_samples, replace=False)
            chain_indices = flat_indices % n_chains
            draw_indices = flat_indices // n_chains

            all_predictions = []
            for s in range(n_samples):
                ci, di = int(chain_indices[s]), int(draw_indices[s])
                draw_dict: dict[str, np.ndarray] = {}
                for var in posterior.data_vars:
                    draw_dict[var] = posterior[var].values[ci, di]

                future_copy = future[["ds", "t"]].copy()
                pred = self._predict(future_copy, "mapx", draw_dict, None)
                all_predictions.append(pred)

            # all_predictions: list of (n_groups, n_timepoints) arrays
            stacked = np.stack(all_predictions, axis=0)  # (n_samples, n_groups, T)

            # Point forecast from mean
            forecasts = self._predict(future, self.method, self.map_approx, self.trace)
            # Collect component columns before any further _predict calls
            new_cols.update(self._collect_predict_columns())

            for group_code in range(forecasts.shape[0]):
                y_min, y_max = self._get_y_bounds(group_code, is_individual)
                scale = y_max - y_min
                new_cols[f"yhat_{group_code}"] = forecasts[group_code] * scale + y_min

                group_samples = stacked[:, group_code, :]  # (n_samples, T)
                new_cols[f"yhat_lower_{group_code}"] = (
                    np.quantile(group_samples, lower_q, axis=0) * scale + y_min
                )
                new_cols[f"yhat_upper_{group_code}"] = (
                    np.quantile(group_samples, upper_q, axis=0) * scale + y_min
                )
        else:
            # --- MAP / MAPX: residual-calibrated intervals ---
            forecasts = self._predict(future, self.method, self.map_approx, self.trace)
            # Collect component columns before _compute_residual_stds
            # (which calls _predict again and would overwrite them)
            new_cols.update(self._collect_predict_columns())

            # Get fitted sigma from map_approx
            sigma_scaled = self._get_map_sigma()

            # Compute in-sample residuals for calibration
            residual_stds = self._compute_residual_stds(is_individual)

            # Total number of training observations
            n_train = len(self.data)

            for group_code in range(forecasts.shape[0]):
                y_min, y_max = self._get_y_bounds(group_code, is_individual)
                scale = y_max - y_min
                yhat = forecasts[group_code] * scale + y_min
                new_cols[f"yhat_{group_code}"] = yhat

                # Noise estimate: use the larger of fitted sigma and residual std
                noise_scaled = max(
                    (
                        sigma_scaled[group_code]
                        if len(sigma_scaled) > 1
                        else sigma_scaled[0]
                    ),
                    residual_stds.get(group_code, sigma_scaled[0]),
                )

                # Forecast-distance scaling: uncertainty grows for predictions
                # further from the training data
                ds_max = pd.Timestamp(self.t_scale_params["ds_max"])
                forecast_distances = np.maximum(
                    (future["ds"] - ds_max).dt.days.values, 0
                ).astype(float)
                distance_scaling = np.sqrt(1.0 + forecast_distances / max(n_train, 1))

                # Convert from Student-t quantile for small samples
                from scipy import stats as sp_stats

                dof = max(n_train - 2, 1)
                z = sp_stats.t.ppf(upper_q, dof)

                half_width = z * noise_scaled * distance_scaling * scale
                new_cols[f"yhat_lower_{group_code}"] = yhat - half_width
                new_cols[f"yhat_upper_{group_code}"] = yhat + half_width

        # Rescale trend component columns (same as predict)
        for group_code in range(forecasts.shape[0]):
            y_min, y_max = self._get_y_bounds(group_code, is_individual)
            scale = y_max - y_min
            for model_type, model_cnt in self.model_idxs.items():
                if not model_type.startswith("lt"):
                    continue

                for model_idx in range(model_cnt):
                    component = f"{model_type}_{model_idx}_{group_code}"
                    if component in new_cols:
                        new_cols[component] = new_cols[component] * scale + y_min

        return pd.concat([future, pd.DataFrame(new_cols, index=future.index)], axis=1)

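    # MAP-interval sketch: in scaled units, the half-width applied above for
    # forecast step h with n training points is
    #
    #     half_width = t_ppf(upper_q, n - 2) * max(sigma, resid_std) * sqrt(1 + h / n)
    #
    # before rescaling by ``scale = y_max - y_min``. Worked example with
    # hypothetical numbers (n = 30 observations, h = 30 days, noise 0.1):
    #
    # >>> from scipy import stats
    # >>> stats.t.ppf(0.975, 28) * 0.1 * np.sqrt(1 + 30 / 30)
    # 0.289...
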
    def _get_y_bounds(
        self, group_code: int, is_individual: bool
    ) -> tuple[float, float]:
        """Get y_min, y_max for a given group."""
        if is_individual:
            return (
                self.y_scale_params[group_code]["y_min"],
                self.y_scale_params[group_code]["y_max"],
            )

        return self.y_scale_params["y_min"], self.y_scale_params["y_max"]

    def _get_map_sigma(self) -> np.ndarray:
        """Extract the fitted sigma values from map_approx.

        Returns
        -------
        np.ndarray
            Array of sigma values (one per group, or one shared value).
        """
        if self.map_approx is not None and "sigma" in self.map_approx:
            sigma = np.atleast_1d(self.map_approx["sigma"])
            return sigma

        # Fallback: estimate from the prior default
        return np.array([0.5])

    def _compute_residual_stds(self, is_individual: bool) -> dict[int, float]:
        """Compute per-group residual standard deviations from in-sample fit.

        Returns
        -------
        dict[int, float]
            Mapping from group_code to residual standard deviation (scaled).
        """
        result: dict[int, float] = {}
        try:
            # Predict on training data
            future_train = self.data[["ds", "t"]].copy()
            in_sample = self._predict(
                future_train, self.method, self.map_approx, self.trace
            )
            for group_code in range(in_sample.shape[0]):
                group_mask = self.group == group_code
                y_true = self.data.loc[group_mask, "y"].values
                y_pred = in_sample[group_code][group_mask]
                residuals = y_true - y_pred
                result[group_code] = float(np.std(residuals))
        except Exception:
            pass

        return result

    def _predict(
        self,
        future: pd.DataFrame,
        method: Method,
        map_approx: dict[str, np.ndarray] | None,
        trace: az.InferenceData | None,
    ):
        """Perform out-of-sample inference for each component.

        Parameters
        ----------
        future : pd.DataFrame
            Pandas dataframe containing the timestamps for which inference
            should be performed.
        method : Method
            The Bayesian inference method to be used. Either a point estimate
            (MAP), a VI method (ADVI etc.) or full Bayesian sampling (MCMC).
        map_approx : dict[str, np.ndarray] | None
            The MAP posterior parameter estimate obtained with the Bayesian
            inference.
        trace : az.InferenceData | None
            Samples from the posterior obtained with the Bayesian inference.
        """
        if method in ["mapx", "map"]:
            return self._predict_map(future, map_approx)

        return self._predict_mcmc(future, trace)

    def plot(
        self,
        future: pd.DataFrame,
        series: str = "series",
        y_true: pd.DataFrame | None = None,
        clip_to_data: bool = True,
    ):
        """Plot the inference results for a given series.

        Parameters
        ----------
        future : pd.DataFrame
            Pandas dataframe containing the timestamps for which inference
            should be performed.
        series : str
            The name of the time series.
        y_true : pd.DataFrame | None
            A pandas dataframe containing the true values for the inference
            period that must at least have columns ds (predictor), y (target)
            and series (name of time series).
        clip_to_data : bool
            If True, clip predictions to the date range of the training data
            (and y_true if provided). This avoids plotting predictions for
            periods before the target series' start date, which can happen
            when transfer learning shifts t_scale_params.
        """
        group_code: int | None = None
        for group_code_, group_name in self.groups_.items():
            if group_name == series:
                group_code = group_code_

        if group_code is None:
            raise ValueError(f"Time series {series} is not present in the dataset!")

        # Check if we have individual scaling
        is_individual = "scaler" not in self.y_scale_params

        # Filter data to only show the specific series
        series_data = self.data[self.data["series"] == series]

        # Clip future to target series date range when requested
        plot_future = future
        if clip_to_data:
            date_min = series_data["ds"].min()
            if y_true is not None:
                y_true_series = y_true.copy()
                if "series" not in y_true_series.columns:
                    y_true_series["series"] = "series"

                y_true_dates = y_true_series[y_true_series["series"] == series]["ds"]
                date_max = max(series_data["ds"].max(), y_true_dates.max())
            else:
                date_max = series_data["ds"].max()

            plot_future = future[
                (future["ds"] >= date_min) & (future["ds"] <= date_max)
            ]

        plt.figure(figsize=(14, 100 * 6))
        plt.subplot(100, 1, 1)
        plt.title("Predictions")
        plt.grid()

        # Get the correct y_max and y_min for this series
        if is_individual:
            y_min = self.y_scale_params[group_code]["y_min"]
            y_max = self.y_scale_params[group_code]["y_max"]
        else:
            y_min = self.y_scale_params["y_min"]
            y_max = self.y_scale_params["y_max"]

        plt.scatter(
            series_data["ds"],
            series_data["y"] * (y_max - y_min) + y_min,
            s=3,
            color="C0",
            label="train y",
        )

        processed_y_true = None
        if y_true is not None:
            processed_y_true = y_true.copy()
            if "series" not in processed_y_true.columns:
                processed_y_true["series"] = "series"

        if processed_y_true is not None:
            plt.scatter(
                processed_y_true[processed_y_true["series"] == series]["ds"],
                processed_y_true[processed_y_true["series"] == series]["y"],
                s=3,
                color="C1",
                label="y_true",
            )

        plt.plot(
            plot_future["ds"],
            plot_future[f"yhat_{group_code}"],
            lw=1,
            label=r"$\widehat{y}$",
        )

        # Plot uncertainty bands if present
        lower_col = f"yhat_lower_{group_code}"
        upper_col = f"yhat_upper_{group_code}"
        if lower_col in plot_future.columns and upper_col in plot_future.columns:
            plt.fill_between(
                plot_future["ds"],
                plot_future[lower_col],
                plot_future[upper_col],
                alpha=0.2,
                color="C0",
                label="Uncertainty",
            )

        plt.legend()

        plot_params = {"idx": 1}
        self._plot(
            plot_params,
            plot_future,
            self.data,
            self.y_scale_params,
            processed_y_true,
            group_code,
        )

    def sample_prior_predictive(self, samples: int = 500) -> az.InferenceData:
        """Sample from the prior predictive distribution.

        Generates simulated observations from the model's priors *before*
        conditioning on data, enabling visual and quantitative verification
        that the chosen priors are scientifically plausible.

        Parameters
        ----------
        samples : int, default 500
            Number of samples to draw from the prior predictive.

        Returns
        -------
        az.InferenceData
            ArviZ InferenceData with ``prior`` and ``prior_predictive``
            groups.

        Raises
        ------
        RuntimeError
            If the model has not been fit yet (``self.model`` does not
            exist).

        Notes
        -----
        The model must be fit first so that the PyMC model graph exists.
        Calling this method does **not** alter the fitted posterior.

        Examples
        --------
        >>> model = LinearTrend() + FourierSeasonality(365.25, 10)
        >>> model.fit(data, method="mapx")
        >>> prior_pred = model.sample_prior_predictive(samples=200)
        """
        if not hasattr(self, "model"):
            raise RuntimeError("Model must be fit before sampling prior predictive.")

        with self.model:
            return pm.sample_prior_predictive(samples=samples)

    def sample_posterior_predictive(self) -> az.InferenceData:
        """Sample from the posterior predictive distribution.

        Generates replicated datasets from the posterior to assess goodness
        of fit. Requires the model to have been fitted with an MCMC or VI
        method so that ``self.trace`` is available.

        Returns
        -------
        az.InferenceData
            ArviZ InferenceData with a ``posterior_predictive`` group added.

        Raises
        ------
        RuntimeError
            If the model has not been fit yet.
        ValueError
            If the model was fit with a MAP method (no posterior trace).

        Examples
        --------
        >>> model.fit(data, method="nuts")
        >>> ppc = model.sample_posterior_predictive()
        """
        if not hasattr(self, "model"):
            raise RuntimeError(
                "Model must be fit before sampling posterior predictive."
            )

        if self.trace is None:
            raise ValueError(
                "Posterior predictive checks require posterior samples. "
                "Fit the model with an MCMC or VI method (e.g., method='nuts')."
            )

        with self.model:
            return pm.sample_posterior_predictive(self.trace)

    def convergence_summary(self, var_names: list[str] | None = None) -> pd.DataFrame:
        """Return an ArviZ convergence summary table.

        Reports posterior mean, sd, HDI, R-hat, and ESS for every (or
        selected) model parameter.

        Parameters
        ----------
        var_names : list[str] or None, default None
            Subset of variable names to include. ``None`` includes all.

        Returns
        -------
        pd.DataFrame
            Summary table produced by ``az.summary``.

        Raises
        ------
        ValueError
            If the model was fit with MAP (no trace).

        Examples
        --------
        >>> model.fit(data, method="nuts")
        >>> model.convergence_summary()
        """
        if self.trace is None:
            raise ValueError(
                "Convergence diagnostics require posterior samples. "
                "Fit with an MCMC or VI method."
            )

        return az.summary(self.trace, var_names=var_names)

    def plot_trace(self, var_names: list[str] | None = None, **kwargs):
        """Plot trace and posterior density for model parameters.

        A thin wrapper around ``az.plot_trace``.

        Parameters
        ----------
        var_names : list[str] or None, default None
            Variables to include. ``None`` plots all.
        **kwargs
            Additional keyword arguments forwarded to ``az.plot_trace``.

        Returns
        -------
        matplotlib.axes.Axes
            The plot axes.

        Raises
        ------
        ValueError
            If no trace is available.
        """
        if self.trace is None:
            raise ValueError("Trace plots require posterior samples.")

        return az.plot_trace(self.trace, var_names=var_names, **kwargs)

    def plot_energy(self, **kwargs):
        """Plot energy diagnostics for HMC/NUTS samplers.

        Wraps ``az.plot_energy`` and reports the Bayesian Fraction of
        Missing Information (BFMI).

        Parameters
        ----------
        **kwargs
            Additional keyword arguments forwarded to ``az.plot_energy``.

        Returns
        -------
        matplotlib.axes.Axes
            The plot axes.
        """
        if self.trace is None:
            raise ValueError("Energy plots require posterior samples.")

        return az.plot_energy(self.trace, **kwargs)

    def plot_posterior(self, var_names: list[str] | None = None, **kwargs):
        """Plot posterior density for model parameters.

        Parameters
        ----------
        var_names : list[str] or None, default None
            Variables to include.
        **kwargs
            Forwarded to ``az.plot_posterior``.

        Returns
        -------
        matplotlib.axes.Axes
        """
        if self.trace is None:
            raise ValueError("Posterior plots require posterior samples.")

        return az.plot_posterior(self.trace, var_names=var_names, **kwargs)

    def summary(self, var_names: list[str] | None = None) -> pd.DataFrame:
        """Return a formatted posterior summary table.

        For MCMC/VI models returns mean, sd, hdi_3%, hdi_97%, R-hat, and
        ESS. For MAP models returns the point estimates.

        Parameters
        ----------
        var_names : list[str] or None
            Parameter names to include.

        Returns
        -------
        pd.DataFrame
        """
        if self.trace is not None:
            return az.summary(self.trace, var_names=var_names)

        if self.map_approx is not None:
            rows = {}
            for k, v in self.map_approx.items():
                val = np.atleast_1d(v)
                # np.atleast_1d never returns a 0-d array, so branch on size
                # rather than ndim to keep scalar parameters unindexed
                if val.size == 1:
                    rows[k] = {"map_estimate": float(val[0])}
                else:
                    for i, vi in enumerate(val.flat):
                        rows[f"{k}[{i}]"] = {"map_estimate": float(vi)}

            return pd.DataFrame(rows).T

        raise ValueError("Model has not been fit yet.")

    def compute_log_likelihood(self) -> None:
        """Compute log-likelihood for each observation and add to trace.

        This is required for WAIC and LOO-CV calculations. If the trace
        already contains log-likelihood, this method does nothing.

        Raises
        ------
        ValueError
            If no trace is available or the model has not been fit yet.
        """
        if self.trace is None:
            raise ValueError("Log-likelihood computation requires posterior samples.")

        if not hasattr(self.trace, "log_likelihood"):
            with self.model:
                pm.compute_log_likelihood(self.trace)

    def waic(self) -> az.ELPDData:
        """Compute the Widely Applicable Information Criterion.

        Returns
        -------
        az.ELPDData
            WAIC result object.

        Raises
        ------
        ValueError
            If no trace is available or the trace lacks log-likelihood.
        """
        if self.trace is None:
            raise ValueError("WAIC requires posterior samples.")

        self.compute_log_likelihood()
        return az.waic(self.trace)

    def loo(self) -> az.ELPDData:
        """Compute LOO-CV via Pareto-smoothed importance sampling.

        Returns
        -------
        az.ELPDData
            LOO result object.

        Raises
        ------
        ValueError
            If no trace is available.
        """
        if self.trace is None:
            raise ValueError("LOO requires posterior samples.")

        self.compute_log_likelihood()
        return az.loo(self.trace)

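    # Diagnostics workflow sketch (requires an MCMC/VI fit so ``self.trace``
    # is populated; ``df`` is hypothetical):
    #
    # >>> model.fit(df, method="nuts")
    # >>> model.convergence_summary()  # R-hat / ESS table
    # >>> model.waic()                 # information criterion; also model.loo()
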
    def _get_prior_var_names(self) -> list[str]:
        """Return posterior variable names needed for prior_from_idata transfer.

        Each component overrides this to declare which variables from the
        source posterior it needs. Called after ``_assign_model_idx``.

        Returns
        -------
        list[str]
            Variable names to request from ``prior_from_idata``.
        """
        return []

    def _assign_model_idx(self, model_idxs: dict[str, int]) -> None:
        """Pre-assign the component's model index without building the PyMC model.

        This mirrors the index-assignment logic inside ``definition()`` so
        that ``_get_prior_var_names()`` can be called *before* the actual
        model is constructed.

        Parameters
        ----------
        model_idxs : dict[str, int]
            Mutable counter dict, same semantics as in ``definition``.
        """
        pass  # Leaf components override this.

    def needs_priors(self, *args, **kwargs):
        return False

    def is_individual(self, *args, **kwargs):
        return self.pool_type == "individual"

    def __add__(self, other):
        return AdditiveTimeSeries(self, other)

    def __radd__(self, other):
        return AdditiveTimeSeries(other, self)

    def __pow__(self, other):
        return MultiplicativeTimeSeries(self, other)

    def __rpow__(self, other):
        return MultiplicativeTimeSeries(other, self)

    def __mul__(self, other):
        return SimpleMultiplicativeTimeSeries(self, other)

    def __rmul__(self, other):
        return SimpleMultiplicativeTimeSeries(other, self)

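# Sketch of what the operators build (trend/seas/const are hypothetical
# component instances):
#
# >>> trend + seas   # AdditiveTimeSeries:             mu = trend + seas
# >>> trend ** seas  # MultiplicativeTimeSeries:       mu = trend * (1 + seas)
# >>> trend * const  # SimpleMultiplicativeTimeSeries: mu = trend * const
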
class CombinedTimeSeries(TimeSeriesModel):
    """Base class for combined time series models.

    This class serves as the foundation for composing multiple time series
    components together. It provides common functionality for combining two
    components (left and right) and propagating method calls to both.

    Parameters
    ----------
    left : TimeSeriesModel | int | float
        The left operand of the combination. Can be a model component or a
        numeric constant.
    right : TimeSeriesModel | int | float
        The right operand of the combination. Can be a model component or a
        numeric constant.

    Attributes
    ----------
    left : TimeSeriesModel | int | float
        The left component of the combination.
    right : TimeSeriesModel | int | float
        The right component of the combination.

    See Also
    --------
    AdditiveTimeSeries : Combines components using addition.
    MultiplicativeTimeSeries : Combines using y = left * (1 + right).
    SimpleMultiplicativeTimeSeries : Combines using y = left * right.
    """

    def __init__(self, left, right):
        self.left = left
        self.right = right

    def _get_initval(self, *args, **kwargs):
        left = {}
        right = {}
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left._get_initval(*args, **kwargs)

        if not (type(self.right) is int or type(self.right) is float):
            right = self.right._get_initval(*args, **kwargs)

        return {**left, **right}

    def _plot(self, *args, **kwargs):
        if not (type(self.left) is int or type(self.left) is float):
            self.left._plot(*args, **kwargs)

        if not (type(self.right) is int or type(self.right) is float):
            self.right._plot(*args, **kwargs)

    def needs_priors(self, *args, **kwargs):
        left = False
        right = False
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left.needs_priors(*args, **kwargs)

        if not (type(self.right) is int or type(self.right) is float):
            right = self.right.needs_priors(*args, **kwargs)

        return left or right

    def is_individual(self, *args, **kwargs):
        left = True
        right = True
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left.is_individual(*args, **kwargs)

        if not (type(self.right) is int or type(self.right) is float):
            right = self.right.is_individual(*args, **kwargs)

        return left and right

    def _get_prior_var_names(self) -> list[str]:
        names: list[str] = []
        if not (type(self.left) is int or type(self.left) is float):
            names.extend(self.left._get_prior_var_names())

        if not (type(self.right) is int or type(self.right) is float):
            names.extend(self.right._get_prior_var_names())

        return names

    def _assign_model_idx(self, model_idxs: dict[str, int]) -> None:
        if not (type(self.left) is int or type(self.left) is float):
            self.left._assign_model_idx(model_idxs)

        if not (type(self.right) is int or type(self.right) is float):
            self.right._assign_model_idx(model_idxs)

    def _get_leaf_components(self) -> list["TimeSeriesModel"]:
        leaves: list["TimeSeriesModel"] = []
        if not (type(self.left) is int or type(self.left) is float):
            leaves.extend(self.left._get_leaf_components())

        if not (type(self.right) is int or type(self.right) is float):
            leaves.extend(self.right._get_leaf_components())

        return leaves

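# Tree-walk sketch: a composed model is a binary tree whose leaves are the
# base components. ``_get_leaf_components`` flattens it left to right
# (``**`` binds tighter than ``+``, so the grouping below is
# trend + (weekly ** yearly); all component names are hypothetical):
#
# >>> m = trend + weekly ** yearly
# >>> len(m._get_leaf_components())
# 3
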
class AdditiveTimeSeries(CombinedTimeSeries):
    """Combines two components using addition: y = left + right.

    This class is created when using the ``+`` operator between time series
    components. The resulting model sums the contributions from both
    components.

    Parameters
    ----------
    left : TimeSeriesModel | int | float
        The left operand of the addition.
    right : TimeSeriesModel | int | float
        The right operand of the addition.

    Examples
    --------
    >>> from vangja import LinearTrend, FourierSeasonality
    >>> # Create an additive model with trend + seasonality
    >>> model = LinearTrend() + FourierSeasonality(period=365.25, series_order=10)
    >>> print(model)
    LT(n=25,r=0.8,tm=None) + FS(p=365.25,n=10,tm=None)
    """

    def definition(self, *args, **kwargs):
        left = self.left
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left.definition(*args, **kwargs)

        right = self.right
        if not (type(self.right) is int or type(self.right) is float):
            right = self.right.definition(*args, **kwargs)

        return left + right

    def _predict(self, *args, **kwargs):
        left = self.left
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left._predict(*args, **kwargs)

        right = self.right
        if not (type(self.right) is int or type(self.right) is float):
            right = self.right._predict(*args, **kwargs)

        return left + right

    def __str__(self):
        return f"{self.left} + {self.right}"

class MultiplicativeTimeSeries(CombinedTimeSeries):
    """Combines two components using y = left * (1 + right).

    This class is created when using the ``**`` operator between time series
    components. This follows the Prophet-style multiplicative seasonality,
    where the right component modulates the left component around its value.
    This formulation is useful when the amplitude of seasonality scales with
    the trend level (heteroscedastic seasonal patterns).

    Parameters
    ----------
    left : TimeSeriesModel | int | float
        The base component (typically a trend).
    right : TimeSeriesModel | int | float
        The multiplicative modifier (typically seasonality).

    Examples
    --------
    >>> from vangja import LinearTrend, FourierSeasonality
    >>> # Create a model with multiplicative seasonality
    >>> model = LinearTrend() ** FourierSeasonality(period=365.25, series_order=10)
    >>> print(model)
    LT(n=25,r=0.8,tm=None) * (1 + FS(p=365.25,n=10,tm=None))

    Notes
    -----
    The ``**`` operator was chosen because ``*`` is used for simple
    multiplication of components.
    """

    def definition(self, *args, **kwargs):
        left = self.left
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left.definition(*args, **kwargs)

        right = self.right
        if not (type(self.right) is int or type(self.right) is float):
            right = self.right.definition(*args, **kwargs)

        return left * (1 + right)

    def _predict(self, *args, **kwargs):
        left = self.left
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left._predict(*args, **kwargs)

        right = self.right
        if not (type(self.right) is int or type(self.right) is float):
            right = self.right._predict(*args, **kwargs)

        return left * (1 + right)

    def __str__(self):
        left = f"{self.left}"
        if type(self.left) is AdditiveTimeSeries:
            left = f"({self.left})"

        return f"{left} * (1 + {self.right})"

class SimpleMultiplicativeTimeSeries(CombinedTimeSeries):
    """Combines two components using simple multiplication: y = left * right.

    This class is created when using the ``*`` operator between time series
    components. The resulting model multiplies the contributions from both
    components directly. This is useful for applying scaling factors or when
    components should truly multiply (not modulate around 1).

    Parameters
    ----------
    left : TimeSeriesModel | int | float
        The left operand of the multiplication.
    right : TimeSeriesModel | int | float
        The right operand of the multiplication.

    Examples
    --------
    >>> from vangja import LinearTrend, UniformConstant
    >>> # Create a model with a scaling factor
    >>> model = LinearTrend() * UniformConstant(lower=0.8, upper=1.2)
    >>> print(model)
    LT(n=25,r=0.8,tm=None) * UC(l=0.8,u=1.2,tm=None)
    """

    def definition(self, *args, **kwargs):
        left = self.left
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left.definition(*args, **kwargs)

        right = self.right
        if not (type(self.right) is int or type(self.right) is float):
            right = self.right.definition(*args, **kwargs)

        return left * right

    def _predict(self, *args, **kwargs):
        left = self.left
        if not (type(self.left) is int or type(self.left) is float):
            left = self.left._predict(*args, **kwargs)

        right = self.right
        if not (type(self.right) is int or type(self.right) is float):
            right = self.right._predict(*args, **kwargs)

        return left * right

    def __str__(self):
        left = f"{self.left}"
        if type(self.left) is AdditiveTimeSeries:
            left = f"({self.left})"

        right = f"{self.right}"
        if type(self.right) is AdditiveTimeSeries:
            right = f"({self.right})"

        return f"{left} * {right}"

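# Composition sketch: __str__ parenthesizes additive operands so the printed
# formula matches the actual grouping (component names and reprs below are
# illustrative):
#
# >>> print((trend + weekly) ** yearly)
# (LT(...) + FS(...)) * (1 + FS(...))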