Source code for pypomp.core.results.panel

from dataclasses import dataclass, field
import pandas as pd
import xarray as xr
import numpy as np
import warnings

from .base import BaseResult, PanelPompEstimationTracesMixin, _merge_results
from ...maths import logmeanexp
from ..rw_sigma import RWSigma
from ..learning_rate import LearningRate
from ..parameters import PanelParameters
from ..optimizer import Optimizer, Adam


@dataclass(eq=False)
class PanelPompBaseResult(BaseResult):
    """Base class for PanelPomp results."""

    theta: PanelParameters | None = None
    """The panel parameter object used for the computation."""



[docs]
@dataclass(eq=False)
class PanelPompPFilterResult(PanelPompBaseResult):
    """Result from PanelPomp.pfilter() method."""

    logLiks: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Log-likelihoods for each parameter set, replicate, and unit."""
    J: int = 0
    """The number of particles used for filtering."""
    reps: int = 1
    """The number of replicates for each parameter set."""
    thresh: float = 0.0
    """The resampling threshold used."""
    CLL_da: xr.DataArray | None = None
    """Conditional log-likelihoods for each unit and time point."""
    ESS_da: xr.DataArray | None = None
    """Effective Sample Size for each unit and time point."""
    filter_mean: xr.DataArray | None = None
    """The mean of the filtering distribution for each state variable."""
    prediction_mean: xr.DataArray | None = None
    """The mean of the predictive distribution for each state variable."""

    def __post_init__(self):
        self.method = "pfilter"

    @property
    def _summary_config(self) -> list[tuple[str, str]]:
        return [
            ("Number of parameter sets", "theta"),
            ("Number of particles (J)", "J"),
            ("Number of replicates", "reps"),
            ("Resampling threshold", "thresh"),
        ]

    def to_dataframe(self, ignore_nan: bool = False) -> pd.DataFrame:
        """Convert panel pfilter result to DataFrame."""
        ll = logmeanexp(self.logLiks.values, axis=-1, ignore_nan=ignore_nan)
        df = (
            pd.DataFrame(ll, columns=self.logLiks.coords["unit"].values)
            .assign(
                theta_idx=lambda x: range(len(x)),
                **{"shared logLik": lambda x: x.sum(axis=1)},
            )
            .melt(
                id_vars=["theta_idx", "shared logLik"],
                var_name="unit",
                value_name="unit logLik",
            )
        )

        if self.theta is not None:
            shared = [
                t.get("shared")
                for t in self.theta._theta
                if t.get("shared") is not None
            ]
            if shared:
                df = df.join(
                    pd.concat(shared, axis=1).T.reset_index(drop=True), on="theta_idx"
                )
            unit_spec = [
                t.get("unit_specific")
                for t in self.theta._theta
                if t.get("unit_specific") is not None
            ]
            if unit_spec:
                u_params = (
                    pd.concat(unit_spec, keys=range(len(unit_spec)))
                    .stack()
                    .unstack(level=1)
                    .reset_index()
                )
                u_params.columns = ["theta_idx", "unit"] + list(u_params.columns[2:])
                df = df.merge(u_params, on=["theta_idx", "unit"], how="left")
        return df

    def CLL(self, average: bool = False) -> pd.DataFrame:
        """Return conditional log-likelihoods as a DataFrame."""
        if self.CLL_da is None or self.CLL_da.size == 0:
            return pd.DataFrame()
        if not average:
            return self.CLL_da.to_dataframe(name="CLL").reset_index()
        avg = logmeanexp(np.asarray(self.CLL_da.values), axis=2)
        return (
            xr.DataArray(
                avg,
                dims=["theta_idx", "unit", "time"],
                coords={
                    "theta_idx": self.CLL_da.coords.get(
                        "theta_idx", np.arange(avg.shape[0])
                    ),
                    "unit": self.CLL_da.coords["unit"].values,
                    "time": self.CLL_da.coords.get("time", np.arange(avg.shape[2])),
                },
            )
            .to_dataframe(name="CLL")
            .reset_index()
        )

    def ESS(self, average: bool = False) -> pd.DataFrame:
        """Return Effective Sample Size as a DataFrame."""
        if self.ESS_da is None or self.ESS_da.size == 0:
            return pd.DataFrame()
        ess = self.ESS_da.mean(dim="rep") if average else self.ESS_da
        return ess.to_dataframe(name="ESS").reset_index()

    def traces(self) -> pd.DataFrame:
        """Return pfilter results formatted as traces (long format)."""
        ll = logmeanexp(self.logLiks.values, axis=-1)
        reps = np.arange(len(ll))
        df_s = pd.DataFrame(
            {"theta_idx": reps, "unit": "shared", "logLik": ll.sum(axis=1)}
        )
        df_u = (
            pd.DataFrame(ll, columns=self.logLiks.coords["unit"].values, index=reps)
            .melt(ignore_index=False, var_name="unit", value_name="logLik")
            .reset_index()
            .rename(columns={"index": "theta_idx"})
        )

        if self.theta is not None:
            shared = [
                t.get("shared")
                for t in self.theta._theta
                if t.get("shared") is not None
            ]
            if shared:
                p_s = pd.concat(shared, axis=1).T.set_axis(reps, axis=0)
                df_s, df_u = (
                    df_s.join(p_s, on="theta_idx"),
                    df_u.join(p_s, on="theta_idx"),
                )
            unit_spec = [
                t.get("unit_specific")
                for t in self.theta._theta
                if t.get("unit_specific") is not None
            ]
            if unit_spec:
                p_u = pd.concat(unit_spec, keys=reps).stack().unstack(level=1)
                p_u.index.names = ["theta_idx", "unit"]
                df_u = df_u.join(p_u, on=["theta_idx", "unit"])
        dfs_to_concat = [df for df in [df_s, df_u] if not df.empty]
        if not dfs_to_concat:
            return pd.DataFrame()

        all_cols = dfs_to_concat[0].columns
        for df in dfs_to_concat[1:]:
            all_cols = all_cols.union(df.columns)

        with warnings.catch_warnings():
            warnings.filterwarnings("ignore", category=FutureWarning)
            df = pd.concat(dfs_to_concat, ignore_index=True)
        df = df.assign(method="pfilter", iteration=0)
        cols = ["theta_idx", "unit", "iteration", "method", "logLik"]
        other_cols = [c for c in df.columns if c not in cols]
        return df[cols + other_cols]

    @staticmethod
    def merge(*results: "PanelPompPFilterResult") -> "PanelPompPFilterResult":
        return _merge_results(
            PanelPompPFilterResult,
            results,
            ["J", "reps", "thresh", "method"],
            ["logLiks", "CLL_da", "ESS_da", "filter_mean", "prediction_mean"],
        )




[docs]
@dataclass(eq=False)
class PanelPompMIFResult(PanelPompEstimationTracesMixin, PanelPompBaseResult):
    """Result from PanelPomp.mif() method."""

    shared_traces: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Shared parameter traces across iterations."""
    unit_traces: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Unit-specific parameter traces across iterations."""
    logLiks: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Log-likelihoods for each unit across iterations."""
    J: int = 0
    """The number of particles used for filtering."""
    M: int = 0
    """The number of iterations performed."""
    rw_sd: RWSigma | None = None
    """The random walk standard deviations for parameter perturbation."""
    a: float = 0.0
    """The cooling fraction used."""
    thresh: float = 0.0
    """The resampling threshold used."""
    n_monitors: int = 0
    """The number of particle filters used to estimate log-likelihoods at each iteration."""
    block: bool = False
    """Whether block-style filtering was used."""

    def __post_init__(self):
        self.method = "mif"

    @property
    def _summary_config(self) -> list[tuple[str, str]]:
        return [
            ("Number of parameter sets", "theta"),
            ("Number of particles (J)", "J"),
            ("Number of iterations (M)", "M"),
            ("Cooling fraction (a)", "a"),
            ("Resampling threshold", "thresh"),
            ("Number of monitors", "n_monitors"),
            ("Block", "block"),
        ]

    @staticmethod
    def merge(*results: "PanelPompMIFResult") -> "PanelPompMIFResult":
        return _merge_results(
            PanelPompMIFResult,
            results,
            ["J", "M", "a", "thresh", "n_monitors", "block", "rw_sd", "method"],
            ["shared_traces", "unit_traces", "logLiks"],
        )




[docs]
@dataclass(eq=False)
class PanelPompTrainResult(PanelPompEstimationTracesMixin, PanelPompBaseResult):
    """Result from PanelPomp.train() method."""

    shared_traces: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Shared parameter traces across iterations."""
    unit_traces: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Unit-specific parameter traces across iterations."""
    logLiks: xr.DataArray = field(default_factory=lambda: xr.DataArray([]))
    """Log-likelihoods for each unit across iterations."""
    optimizer: Optimizer = field(default_factory=Adam)
    """The optimizer used for training."""
    J: int = 0
    """The number of particles used for filtering."""
    M: int = 0
    """The number of iterations performed."""
    eta: LearningRate | None = None
    """The learning rate object."""
    alpha: float = 0.97
    """The discount factor for the gradient moving average."""
    alpha_cooling: float = 1.0
    """The cooling factor for the discount factor."""

    def __post_init__(self):
        self.method = "train"

    @property
    def _summary_config(self) -> list[tuple[str, str]]:
        return [
            ("Number of parameter sets", "theta"),
            ("Optimizer", "optimizer"),
            ("Number of particles (J)", "J"),
            ("Number of iterations (M)", "M"),
            ("Learning rate (eta)", "eta"),
            ("Discount factor (alpha)", "alpha"),
            ("Cooling factor for alpha", "alpha_cooling"),
        ]

    @staticmethod
    def merge(*results: "PanelPompTrainResult") -> "PanelPompTrainResult":
        return _merge_results(
            PanelPompTrainResult,
            results,
            ["optimizer", "J", "M", "eta", "alpha", "alpha_cooling", "method"],
            ["shared_traces", "unit_traces", "logLiks"],
        )