Source code for causalpy.checks.prior_sensitivity

#   Copyright 2022 - 2026 The PyMC Labs Developers
#
#   Licensed under the Apache License, Version 2.0 (the "License");
#   you may not use this file except in compliance with the License.
#   You may obtain a copy of the License at
#
#       http://www.apache.org/licenses/LICENSE-2.0
#
#   Unless required by applicable law or agreed to in writing, software
#   distributed under the License is distributed on an "AS IS" BASIS,
#   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#   See the License for the specific language governing permissions and
#   limitations under the License.
"""
Prior sensitivity check for Bayesian causal inference experiments.

Re-fits the experiment with alternative prior specifications and
compares posterior estimates to assess how sensitive the conclusions
are to prior choices.
"""

from __future__ import annotations

import logging
from typing import Any

import matplotlib.pyplot as plt
import pandas as pd

from causalpy.checks._plot_helpers import forest_plot
from causalpy.checks.base import CheckResult, clone_model
from causalpy.experiments.base import BaseExperiment
from causalpy.experiments.diff_in_diff import DifferenceInDifferences
from causalpy.experiments.instrumental_variable import InstrumentalVariable
from causalpy.experiments.interrupted_time_series import InterruptedTimeSeries
from causalpy.experiments.inverse_propensity_weighting import (
    InversePropensityWeighting,
)
from causalpy.experiments.prepostnegd import PrePostNEGD
from causalpy.experiments.regression_discontinuity import RegressionDiscontinuity
from causalpy.experiments.regression_kink import RegressionKink
from causalpy.experiments.staggered_did import StaggeredDifferenceInDifferences
from causalpy.experiments.synthetic_control import SyntheticControl
from causalpy.pipeline import PipelineContext
from causalpy.pymc_models import PyMCModel

logger = logging.getLogger(__name__)



[docs]
class PriorSensitivity:
    """Re-fit the experiment with alternative models/priors and compare.

    Each alternative is specified as a dict with ``"name"`` and ``"model"``
    keys.  The check re-instantiates the experiment for each alternative
    model and compares the resulting effect summaries.

    Parameters
    ----------
    alternatives : list of dict
        Each dict must have ``"name"`` (str) and ``"model"`` (PyMCModel
        or RegressorMixin) keys.

    Examples
    --------
    >>> import causalpy as cp  # doctest: +SKIP
    >>> check = cp.checks.PriorSensitivity(  # doctest: +SKIP
    ...     alternatives=[
    ...         {"name": "diffuse", "model": cp.pymc_models.LinearRegression(...)},
    ...         {"name": "tight", "model": cp.pymc_models.LinearRegression(...)},
    ...     ]
    ... )
    """

    applicable_methods: set[type[BaseExperiment]] = {
        InterruptedTimeSeries,
        DifferenceInDifferences,
        SyntheticControl,
        StaggeredDifferenceInDifferences,
        RegressionDiscontinuity,
        RegressionKink,
        PrePostNEGD,
        InversePropensityWeighting,
        InstrumentalVariable,
    }


[docs]
    @staticmethod
    def plot(
        result: CheckResult,
        *,
        baseline_stats: Any | None = None,
        baseline_label: str = "baseline",
        figsize: tuple[float, float] | None = None,
    ) -> tuple[plt.Figure, plt.Axes]:
        """Forest plot of effect estimates under alternative priors.

        Parameters
        ----------
        result : CheckResult
            The ``CheckResult`` returned by :meth:`run`.
        baseline_stats : EffectSummary, optional
            The original experiment's ``effect_summary()``.  When provided
            a baseline row is prepended.
        baseline_label : str
            Label for the baseline row.
        figsize : tuple, optional
            Passed to matplotlib.

        Returns
        -------
        tuple[plt.Figure, plt.Axes]
        """
        baseline_row = None
        if baseline_stats is not None and baseline_stats.table is not None:
            tbl = baseline_stats.table
            baseline_row = {
                "mean": tbl["mean"].iloc[0],
                "hdi_lower": tbl["hdi_lower"].iloc[0],
                "hdi_upper": tbl["hdi_upper"].iloc[0],
            }

        if result.table is None:
            raise ValueError("Cannot plot: CheckResult has no table.")

        return forest_plot(
            result.table,
            label_col="prior_spec",
            baseline_row=baseline_row,
            baseline_label=baseline_label,
            xlabel="Average causal impact",
            title="Prior sensitivity: effect estimates under different priors",
            figsize=figsize,
            baseline_color="C0",
            comparison_color="C1",
        )



[docs]
    def __init__(self, alternatives: list[dict[str, Any]]) -> None:
        if not alternatives:
            raise ValueError("alternatives must be a non-empty list")
        for i, alt in enumerate(alternatives):
            if "name" not in alt or "model" not in alt:
                raise ValueError(
                    f"Alternative {i} must have 'name' and 'model' keys, "
                    f"got keys: {list(alt.keys())}"
                )
        self.alternatives = alternatives



[docs]
    def validate(self, experiment: BaseExperiment) -> None:
        """Verify the experiment uses a Bayesian (PyMC) model."""
        if not isinstance(experiment.model, PyMCModel):
            raise TypeError(
                "PriorSensitivity requires a Bayesian (PyMC) model. "
                f"Got {type(experiment.model).__name__}."
            )



[docs]
    def run(
        self,
        experiment: BaseExperiment,
        context: PipelineContext,
    ) -> CheckResult:
        """Re-fit with each alternative model and compare effect estimates."""
        if context.experiment_config is None:
            raise RuntimeError(
                "No experiment_config in context. Use EstimateEffect "
                "before SensitivityAnalysis."
            )

        method = context.experiment_config["method"]
        base_kwargs = {
            k: v
            for k, v in context.experiment_config.items()
            if k not in ("method", "model")
        }

        rows: list[dict[str, Any]] = []

        for alt in self.alternatives:
            name = alt["name"]
            model = clone_model(alt["model"])
            logger.info("PriorSensitivity: fitting with '%s'", name)

            alt_experiment = method(context.data, model=model, **base_kwargs)

            try:
                summary = alt_experiment.effect_summary()
                row: dict[str, Any] = {"prior_spec": name}
                if summary.table is not None and not summary.table.empty:
                    for col in summary.table.columns:
                        row[col] = summary.table[col].iloc[0]
                rows.append(row)
            except (NotImplementedError, Exception) as exc:
                logger.warning(
                    "PriorSensitivity: effect_summary() failed for '%s': %s",
                    name,
                    exc,
                )
                rows.append({"prior_spec": name, "error": str(exc)})

        table = pd.DataFrame(rows) if rows else None

        text = (
            f"Prior sensitivity analysis: compared {len(self.alternatives)} "
            f"alternative prior specifications."
        )

        baseline_stats = experiment.effect_summary()

        check_result = CheckResult(
            check_name="PriorSensitivity",
            passed=None,
            table=table,
            text=text,
        )

        if table is not None and not table.empty:
            try:
                fig, _ = self.plot(check_result, baseline_stats=baseline_stats)
                check_result.figures = [fig]
            except Exception:
                logger.debug(
                    "PriorSensitivity: could not generate figure", exc_info=True
                )

        return check_result