From 7962b50909511e7c86ba3e405f3802c6dc6a8d80 Mon Sep 17 00:00:00 2001
From: juanitorduz <juanitorduz@gmail.com>
Date: Wed, 12 Nov 2025 11:41:58 +0100
Subject: [PATCH 1/6] init

---
 causalpy/data/simulate_data.py                |  33 ++---
 causalpy/experiments/base.py                  |  24 ++--
 causalpy/experiments/diff_in_diff.py          |  31 ++--
 causalpy/experiments/instrumental_variable.py |  20 +--
 .../experiments/interrupted_time_series.py    |  18 ++-
 .../inverse_propensity_weighting.py           |  55 ++++---
 causalpy/experiments/prepostnegd.py           |  12 +-
 .../experiments/regression_discontinuity.py   |  24 ++--
 causalpy/experiments/regression_kink.py       |  35 +++--
 causalpy/experiments/synthetic_control.py     |  38 +++--
 causalpy/plot_utils.py                        |   6 +-
 causalpy/pymc_models.py                       | 135 ++++++++++++------
 causalpy/skl_models.py                        |  26 ++--
 causalpy/utils.py                             |   8 +-
 docs/source/_static/interrogate_badge.svg     |   6 +-
 15 files changed, 295 insertions(+), 176 deletions(-)

diff --git a/causalpy/data/simulate_data.py b/causalpy/data/simulate_data.py
index e40822e6..ae705059 100644
--- a/causalpy/data/simulate_data.py
+++ b/causalpy/data/simulate_data.py
@@ -31,7 +31,7 @@ def _smoothed_gaussian_random_walk(
     gaussian_random_walk_mu: float,
     gaussian_random_walk_sigma: float,
     N: int,
-    lowess_kwargs: dict[str, Any],
+    lowess_kwargs: dict,
 ) -> tuple[np.ndarray, np.ndarray]:
     """
     Generates Gaussian random walk data and applies LOWESS.
@@ -57,7 +57,7 @@ def generate_synthetic_control_data(
     treatment_time: int = 70,
     grw_mu: float = 0.25,
     grw_sigma: float = 1,
-    lowess_kwargs: dict[str, Any] | None = None,
+    lowess_kwargs: dict = default_lowess_kwargs,
 ) -> tuple[pd.DataFrame, np.ndarray]:
     """
     Generates data for synthetic control example.
@@ -78,9 +78,6 @@ def generate_synthetic_control_data(
     >>> from causalpy.data.simulate_data import generate_synthetic_control_data
     >>> df, weightings_true = generate_synthetic_control_data(treatment_time=70)
     """
-    if lowess_kwargs is None:
-        lowess_kwargs = default_lowess_kwargs
-
     # 1. Generate non-treated variables
     df = pd.DataFrame(
         {
@@ -166,7 +163,9 @@ def generate_time_series_data(
     return df
 
 
-def generate_time_series_data_seasonal(treatment_time: pd.Timestamp) -> pd.DataFrame:
+def generate_time_series_data_seasonal(
+    treatment_time: pd.Timestamp,
+) -> pd.DataFrame:
     """
     Generates 10 years of monthly data with seasonality
     """
@@ -184,7 +183,9 @@ def generate_time_series_data_seasonal(treatment_time: pd.Timestamp) -> pd.DataF
 
     N = df.shape[0]
     idx = np.arange(N)[df.index > treatment_time]
-    df["causal effect"] = 100 * gamma(10).pdf(np.arange(0, N, 1) - np.min(idx))
+    df["causal effect"] = 100 * gamma(10).pdf(
+        np.array(np.arange(0, N, 1)) - int(np.min(idx))
+    )
 
     df["y"] += df["causal effect"]
     df["y"] += norm(0, 2).rvs(N)
@@ -310,8 +311,8 @@ def impact(x: np.ndarray) -> np.ndarray:
 def generate_ancova_data(
     N: int = 200,
     pre_treatment_means: np.ndarray = np.array([10, 12]),
-    treatment_effect: float = 2,
-    sigma: float = 1,
+    treatment_effect: int = 2,
+    sigma: int = 1,
 ) -> pd.DataFrame:
     """
     Generate ANCOVA example data
@@ -445,7 +446,7 @@ def generate_multicell_geolift_data() -> pd.DataFrame:
 
 
 def generate_seasonality(
-    n: int = 12, amplitude: float = 1, length_scale: float = 0.5
+    n: int = 12, amplitude: int = 1, length_scale: float = 0.5
 ) -> np.ndarray:
     """Generate monthly seasonality by sampling from a Gaussian process with a
     Gaussian kernel, using numpy code"""
@@ -463,9 +464,9 @@ def generate_seasonality(
 def periodic_kernel(
     x1: np.ndarray,
     x2: np.ndarray,
-    period: float = 1,
-    length_scale: float = 1,
-    amplitude: float = 1,
+    period: int = 1,
+    length_scale: float = 1.0,
+    amplitude: int = 1,
 ) -> np.ndarray:
     """Generate a periodic kernel for gaussian process"""
     return amplitude**2 * np.exp(
@@ -475,10 +476,10 @@ def periodic_kernel(
 
 def create_series(
     n: int = 52,
-    amplitude: float = 1,
-    length_scale: float = 2,
+    amplitude: int = 1,
+    length_scale: int = 2,
     n_years: int = 4,
-    intercept: float = 3,
+    intercept: int = 3,
 ) -> np.ndarray:
     """
     Returns numpy tile with generated seasonality data repeated over
diff --git a/causalpy/experiments/base.py b/causalpy/experiments/base.py
index f24cc69a..9f0b26ac 100644
--- a/causalpy/experiments/base.py
+++ b/causalpy/experiments/base.py
@@ -16,6 +16,7 @@
 """
 
 from abc import abstractmethod
+from typing import Any, Union
 
 import arviz as az
 import matplotlib.pyplot as plt
@@ -29,10 +30,12 @@
 class BaseExperiment:
     """Base class for quasi experimental designs."""
 
+    labels: list[str]
+
     supports_bayes: bool
     supports_ols: bool
 
-    def __init__(self, model=None):
+    def __init__(self, model: Union[PyMCModel, RegressorMixin] | None = None) -> None:
         # Ensure we've made any provided Scikit Learn model (as identified as being type
         # RegressorMixin) compatible with CausalPy by appending our custom methods.
         if isinstance(model, RegressorMixin):
@@ -50,16 +53,19 @@ def __init__(self, model=None):
         if self.model is None:
             raise ValueError("model not set or passed.")
 
+    def fit(self, *args: Any, **kwargs: Any) -> None:
+        raise NotImplementedError("fit method not implemented")
+
     @property
-    def idata(self):
+    def idata(self) -> az.InferenceData:
         """Return the InferenceData object of the model. Only relevant for PyMC models."""
         return self.model.idata
 
-    def print_coefficients(self, round_to=None):
+    def print_coefficients(self, round_to: int | None = None) -> None:
         """Ask the model to print its coefficients."""
         self.model.print_coefficients(self.labels, round_to)
 
-    def plot(self, *args, **kwargs) -> tuple:
+    def plot(self, *args: Any, **kwargs: Any) -> tuple:
         """Plot the model.
 
         Internally, this function dispatches to either `_bayesian_plot` or `_ols_plot`
@@ -75,16 +81,16 @@ def plot(self, *args, **kwargs) -> tuple:
                 raise ValueError("Unsupported model type")
 
     @abstractmethod
-    def _bayesian_plot(self, *args, **kwargs):
+    def _bayesian_plot(self, *args: Any, **kwargs: Any) -> tuple:
         """Abstract method for plotting the model."""
         raise NotImplementedError("_bayesian_plot method not yet implemented")
 
     @abstractmethod
-    def _ols_plot(self, *args, **kwargs):
+    def _ols_plot(self, *args: Any, **kwargs: Any) -> tuple:
         """Abstract method for plotting the model."""
         raise NotImplementedError("_ols_plot method not yet implemented")
 
-    def get_plot_data(self, *args, **kwargs) -> pd.DataFrame:
+    def get_plot_data(self, *args: Any, **kwargs: Any) -> pd.DataFrame:
         """Recover the data of an experiment along with the prediction and causal impact information.
 
         Internally, this function dispatches to either :func:`get_plot_data_bayesian` or :func:`get_plot_data_ols`
@@ -98,11 +104,11 @@ def get_plot_data(self, *args, **kwargs) -> pd.DataFrame:
             raise ValueError("Unsupported model type")
 
     @abstractmethod
-    def get_plot_data_bayesian(self, *args, **kwargs):
+    def get_plot_data_bayesian(self, *args: Any, **kwargs: Any) -> pd.DataFrame:
         """Abstract method for recovering plot data."""
         raise NotImplementedError("get_plot_data_bayesian method not yet implemented")
 
     @abstractmethod
-    def get_plot_data_ols(self, *args, **kwargs):
+    def get_plot_data_ols(self, *args: Any, **kwargs: Any) -> pd.DataFrame:
         """Abstract method for recovering plot data."""
         raise NotImplementedError("get_plot_data_ols method not yet implemented")
diff --git a/causalpy/experiments/diff_in_diff.py b/causalpy/experiments/diff_in_diff.py
index a21abd94..f0dd87ad 100644
--- a/causalpy/experiments/diff_in_diff.py
+++ b/causalpy/experiments/diff_in_diff.py
@@ -15,6 +15,8 @@
 Difference in differences
 """
 
+from typing import Union
+
 import arviz as az
 import numpy as np
 import pandas as pd
@@ -92,8 +94,8 @@ def __init__(
         time_variable_name: str,
         group_variable_name: str,
         post_treatment_variable_name: str = "post_treatment",
-        model=None,
-        **kwargs,
+        model: Union[PyMCModel, RegressorMixin] | None = None,
+        **kwargs: dict,
     ) -> None:
         super().__init__(model=model)
         self.causal_impact: xr.DataArray | float | None
@@ -234,14 +236,14 @@ def __init__(
                 f"{self.group_variable_name}:{self.post_treatment_variable_name}"
             )
             matched_key = next((k for k in coef_map if interaction_term in k), None)
-            att = coef_map.get(matched_key)
+            att = coef_map.get(matched_key) if matched_key is not None else None
             self.causal_impact = att
         else:
             raise ValueError("Model type not recognized")
 
         return
 
-    def input_validation(self):
+    def input_validation(self) -> None:
         # Validate formula structure and interaction interaction terms
         self._validate_formula_interaction_terms()
 
@@ -269,7 +271,7 @@ def input_validation(self):
                 coded. Consisting of 0's and 1's only."""
             )
 
-    def _validate_formula_interaction_terms(self):
+    def _validate_formula_interaction_terms(self) -> None:
         """
         Validate that the formula contains at most one interaction term and no three-way or higher-order interactions.
         Raises FormulaException if more than one interaction term is found or if any interaction term has more than 2 variables.
@@ -299,7 +301,7 @@ def _validate_formula_interaction_terms(self):
                 "Multiple interaction terms are not currently supported as they complicate interpretation of the causal effect."
             )
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = 2) -> None:
         """Print summary of main results and model coefficients.
 
         :param round_to:
@@ -311,11 +313,13 @@ def summary(self, round_to=None) -> None:
         print(self._causal_impact_summary_stat(round_to))
         self.print_coefficients(round_to)
 
-    def _causal_impact_summary_stat(self, round_to=None) -> str:
+    def _causal_impact_summary_stat(self, round_to: int | None = None) -> str:
         """Computes the mean and 94% credible interval bounds for the causal impact."""
         return f"Causal impact = {convert_to_string(self.causal_impact, round_to=round_to)}"
 
-    def _bayesian_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
+    def _bayesian_plot(
+        self, round_to: int | None = None, **kwargs: dict
+    ) -> tuple[plt.Figure, plt.Axes]:
         """
         Plot the results
 
@@ -463,9 +467,10 @@ def _plot_causal_impact_arrow(results, ax):
         )
         return fig, ax
 
-    def _ols_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
+    def _ols_plot(
+        self, round_to: int | None = 2, **kwargs: dict
+    ) -> tuple[plt.Figure, plt.Axes]:
         """Generate plot for difference-in-differences"""
-        round_to = kwargs.get("round_to")
         fig, ax = plt.subplots()
 
         # Plot raw data
@@ -528,11 +533,15 @@ def _ols_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
             va="center",
         )
         # formatting
+        # In OLS context, causal_impact should be a float, but mypy doesn't know this
+        causal_impact_value = (
+            float(self.causal_impact) if self.causal_impact is not None else 0.0
+        )
         ax.set(
             xlim=[-0.05, 1.1],
             xticks=[0, 1],
             xticklabels=["pre", "post"],
-            title=f"Causal impact = {round_num(self.causal_impact, round_to)}",
+            title=f"Causal impact = {round_num(causal_impact_value, round_to)}",
         )
         ax.legend(fontsize=LEGEND_FONT_SIZE)
         return fig, ax
diff --git a/causalpy/experiments/instrumental_variable.py b/causalpy/experiments/instrumental_variable.py
index 001ce9af..b7cbd737 100644
--- a/causalpy/experiments/instrumental_variable.py
+++ b/causalpy/experiments/instrumental_variable.py
@@ -97,10 +97,10 @@ def __init__(
         data: pd.DataFrame,
         instruments_formula: str,
         formula: str,
-        model=None,
-        priors=None,
-        **kwargs,
-    ):
+        model: BaseExperiment | None = None,
+        priors: dict | None = None,
+        **kwargs: dict,
+    ) -> None:
         super().__init__(model=model)
         self.expt_type = "Instrumental Variable Regression"
         self.data = data
@@ -138,11 +138,11 @@ def __init__(
                 "lkj_sd": 1,
             }
         self.priors = priors
-        self.model.fit(
+        self.model.fit(  # type: ignore[call-arg,union-attr]
             X=self.X, Z=self.Z, y=self.y, t=self.t, coords=COORDS, priors=self.priors
         )
 
-    def input_validation(self):
+    def input_validation(self) -> None:
         """Validate the input data and model formula for correctness"""
         treatment = self.instruments_formula.split("~")[0]
         test = treatment.strip() in self.instruments_data.columns
@@ -165,7 +165,7 @@ def input_validation(self):
                 The coefficients should be interpreted appropriately."""
             )
 
-    def get_2SLS_fit(self):
+    def get_2SLS_fit(self) -> None:
         """
         Two Stage Least Squares Fit
 
@@ -187,7 +187,7 @@ def get_2SLS_fit(self):
         self.first_stage_reg = first_stage_reg
         self.second_stage_reg = second_stage_reg
 
-    def get_naive_OLS_fit(self):
+    def get_naive_OLS_fit(self) -> None:
         """
         Naive Ordinary Least Squares
 
@@ -199,7 +199,7 @@ def get_naive_OLS_fit(self):
         self.ols_beta_params = dict(zip(self._x_design_info.column_names, beta_params))
         self.ols_reg = ols_reg
 
-    def plot(self, round_to=None):
+    def plot(self, *args, **kwargs) -> None:  # type: ignore[override]
         """
         Plot the results
 
@@ -208,7 +208,7 @@ def plot(self, round_to=None):
         """
         raise NotImplementedError("Plot method not implemented.")
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = None) -> None:
         """Print summary of main results and model coefficients.
 
         :param round_to:
diff --git a/causalpy/experiments/interrupted_time_series.py b/causalpy/experiments/interrupted_time_series.py
index b60e452d..25ff1932 100644
--- a/causalpy/experiments/interrupted_time_series.py
+++ b/causalpy/experiments/interrupted_time_series.py
@@ -89,8 +89,8 @@ def __init__(
         data: pd.DataFrame,
         treatment_time: Union[int, float, pd.Timestamp],
         formula: str,
-        model=None,
-        **kwargs,
+        model: Union[PyMCModel, RegressorMixin] | None = None,
+        **kwargs: dict,
     ) -> None:
         super().__init__(model=model)
         self.pre_y: xr.DataArray
@@ -189,7 +189,9 @@ def __init__(
             self.post_impact
         )
 
-    def input_validation(self, data, treatment_time):
+    def input_validation(
+        self, data: pd.DataFrame, treatment_time: Union[int, float, pd.Timestamp]
+    ) -> None:
         """Validate the input data and model formula for correctness"""
         if isinstance(data.index, pd.DatetimeIndex) and not isinstance(
             treatment_time, pd.Timestamp
@@ -204,7 +206,7 @@ def input_validation(self, data, treatment_time):
                 "If data.index is not DatetimeIndex, treatment_time must be pd.Timestamp."  # noqa: E501
             )
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = None) -> None:
         """Print summary of main results and model coefficients.
 
         :param round_to:
@@ -215,7 +217,7 @@ def summary(self, round_to=None) -> None:
         self.print_coefficients(round_to)
 
     def _bayesian_plot(
-        self, round_to=None, **kwargs
+        self, round_to: int | None = 2, **kwargs: dict
     ) -> tuple[plt.Figure, List[plt.Axes]]:
         """
         Plot the results
@@ -340,7 +342,9 @@ def _bayesian_plot(
 
         return fig, ax
 
-    def _ols_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, List[plt.Axes]]:
+    def _ols_plot(
+        self, round_to: int | None = 2, **kwargs: dict
+    ) -> tuple[plt.Figure, List[plt.Axes]]:
         """
         Plot the results
 
@@ -363,7 +367,7 @@ def _ols_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, List[plt.Axes]
             c="k",
         )
         ax[0].set(
-            title=f"$R^2$ on pre-intervention data = {round_num(self.score, round_to)}"
+            title=f"$R^2$ on pre-intervention data = {round_num(float(self.score), round_to)}"
         )
 
         ax[1].plot(self.datapre.index, self.pre_impact, "k.")
diff --git a/causalpy/experiments/inverse_propensity_weighting.py b/causalpy/experiments/inverse_propensity_weighting.py
index 1a04c070..99cbe7c0 100644
--- a/causalpy/experiments/inverse_propensity_weighting.py
+++ b/causalpy/experiments/inverse_propensity_weighting.py
@@ -78,9 +78,9 @@ def __init__(
         formula: str,
         outcome_variable: str,
         weighting_scheme: str,
-        model=None,
-        **kwargs,
-    ):
+        model: BaseExperiment | None = None,
+        **kwargs: dict,
+    ) -> None:
         super().__init__(model=model)
         self.expt_type = "Inverse Propensity Score Weighting"
         self.data = data
@@ -98,12 +98,12 @@ def __init__(
 
         COORDS = {"obs_ind": list(range(self.X.shape[0])), "coeffs": self.labels}
         self.coords = COORDS
-        self.X_outcome = pd.DataFrame(self.X, columns=self.coords["coeffs"])
+        self.X_outcome = pd.DataFrame(self.X, columns=self.labels)
         self.X_outcome["trt"] = self.t
         self.coords["outcome_coeffs"] = self.X_outcome.columns
-        self.model.fit(X=self.X, t=self.t, coords=COORDS)
+        self.model.fit(X=self.X, t=self.t, coords=COORDS)  # type: ignore[call-arg]
 
-    def input_validation(self):
+    def input_validation(self) -> None:
         """Validate the input data and model formula for correctness"""
         treatment = self.formula.split("~")[0]
         test = treatment.strip() in self.data.columns
@@ -125,7 +125,9 @@ def input_validation(self):
                 """
             )
 
-    def make_robust_adjustments(self, ps):
+    def make_robust_adjustments(
+        self, ps: np.ndarray
+    ) -> tuple[pd.Series, pd.Series, int, int]:
         """This estimator is discussed in Aronow
         and Miller's book as being related to the
         Horvitz Thompson method"""
@@ -145,7 +147,9 @@ def make_robust_adjustments(self, ps):
         weighted_outcome0 = outcome_ntrt * i_propensity0
         return weighted_outcome0, weighted_outcome1, n_ntrt, n_trt
 
-    def make_raw_adjustments(self, ps):
+    def make_raw_adjustments(
+        self, ps: np.ndarray
+    ) -> tuple[pd.Series, pd.Series, int, int]:
         """This estimator is discussed in Aronow and
         Miller as the simplest of base form of
         inverse propensity weighting schemes"""
@@ -164,7 +168,9 @@ def make_raw_adjustments(self, ps):
         weighted_outcome0 = outcome_ntrt * i_propensity0
         return weighted_outcome0, weighted_outcome1, n_ntrt, n_trt
 
-    def make_overlap_adjustments(self, ps):
+    def make_overlap_adjustments(
+        self, ps: np.ndarray
+    ) -> tuple[pd.Series, pd.Series, pd.Series, pd.Series]:
         """This weighting scheme was adapted from
         Lucy D’Agostino McGowan's blog on
         Propensity Score Weights referenced in
@@ -184,7 +190,9 @@ def make_overlap_adjustments(self, ps):
         weighted_outcome0 = (1 - t[t == 0]) * outcome_ntrt * i_propensity0
         return weighted_outcome0, weighted_outcome1, n_ntrt, n_trt
 
-    def make_doubly_robust_adjustment(self, ps):
+    def make_doubly_robust_adjustment(
+        self, ps: np.ndarray
+    ) -> tuple[pd.Series, pd.Series, None, None]:
         """The doubly robust weighting scheme is also
         discussed in Aronow and Miller, but a bit more generally
         than our implementation here. Here we have specified
@@ -203,7 +211,9 @@ def make_doubly_robust_adjustment(self, ps):
         weighted_outcome1 = t * (self.y - m1_pred) / X["ps"] + m1_pred
         return weighted_outcome0, weighted_outcome1, None, None
 
-    def get_ate(self, i, idata, method="doubly_robust"):
+    def get_ate(
+        self, i: int, idata: az.InferenceData, method: str = "doubly_robust"
+    ) -> list[float]:
         ### Post processing the sample posterior distribution for propensity scores
         ### One sample at a time.
         ps = idata["posterior"]["p"].stack(z=("chain", "draw"))[:, i].values
@@ -231,23 +241,27 @@ def get_ate(self, i, idata, method="doubly_robust"):
                 weighted_outcome_trt,
                 n_ntrt,
                 n_trt,
-            ) = self.make_overlap_adjustments(ps)
-            ntrt = np.sum(weighted_outcome_ntrt) / np.sum(n_ntrt)
-            trt = np.sum(weighted_outcome_trt) / np.sum(n_trt)
+            ) = self.make_overlap_adjustments(ps)  # type: ignore[assignment]
+            ntrt = np.sum(weighted_outcome_ntrt) / np.sum(n_ntrt)  # type: ignore[arg-type]
+            trt = np.sum(weighted_outcome_trt) / np.sum(n_trt)  # type: ignore[arg-type]
         else:
             (
                 weighted_outcome_ntrt,
                 weighted_outcome_trt,
                 n_ntrt,
                 n_trt,
-            ) = self.make_doubly_robust_adjustment(ps)
+            ) = self.make_doubly_robust_adjustment(ps)  # type: ignore[assignment]
             trt = np.mean(weighted_outcome_trt)
             ntrt = np.mean(weighted_outcome_ntrt)
         ate = trt - ntrt
         return [ate, trt, ntrt]
 
     def plot_ate(
-        self, idata=None, method=None, prop_draws=100, ate_draws=300
+        self,
+        idata: az.InferenceData | None = None,
+        method: str | None = None,
+        prop_draws: int = 100,
+        ate_draws: int = 300,
     ) -> tuple[plt.Figure, List[plt.Axes]]:
         if idata is None:
             idata = self.model.idata
@@ -376,7 +390,9 @@ def make_hists(idata, i, axs, method=method):
 
         return fig, axs
 
-    def weighted_percentile(self, data, weights, perc):
+    def weighted_percentile(
+        self, data: np.ndarray, weights: np.ndarray, perc: float
+    ) -> float:
         """
         perc : percentile in [0-1]!
         """
@@ -391,7 +407,10 @@ def weighted_percentile(self, data, weights, perc):
         return np.interp(perc, cdf, data)
 
     def plot_balance_ecdf(
-        self, covariate, idata=None, weighting_scheme=None
+        self,
+        covariate: str,
+        idata: az.InferenceData | None = None,
+        weighting_scheme: str | None = None,
     ) -> tuple[plt.Figure, List[plt.Axes]]:
         """
         Plotting function takes a single covariate and shows the
diff --git a/causalpy/experiments/prepostnegd.py b/causalpy/experiments/prepostnegd.py
index d6a48af7..f67b0008 100644
--- a/causalpy/experiments/prepostnegd.py
+++ b/causalpy/experiments/prepostnegd.py
@@ -94,9 +94,9 @@ def __init__(
         formula: str,
         group_variable_name: str,
         pretreatment_variable_name: str,
-        model=None,
-        **kwargs,
-    ):
+        model: PyMCModel | None = None,
+        **kwargs: dict,
+    ) -> None:
         super().__init__(model=model)
         self.causal_impact: xr.DataArray
         self.pred_xi: np.ndarray
@@ -202,7 +202,7 @@ def _get_treatment_effect_coeff(self) -> str:
 
         raise NameError("Unable to find coefficient name for the treatment effect")
 
-    def _causal_impact_summary_stat(self, round_to) -> str:
+    def _causal_impact_summary_stat(self, round_to: int | None = 2) -> str:
         """Computes the mean and 94% credible interval bounds for the causal impact."""
         percentiles = self.causal_impact.quantile([0.03, 1 - 0.03]).values
         ci = (
@@ -212,7 +212,7 @@ def _causal_impact_summary_stat(self, round_to) -> str:
         causal_impact = f"{round_num(self.causal_impact.mean(), round_to)}, "
         return f"Causal impact = {causal_impact + ci}"
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = None) -> None:
         """Print summary of main results and model coefficients.
 
         :param round_to:
@@ -226,7 +226,7 @@ def summary(self, round_to=None) -> None:
         self.print_coefficients(round_to)
 
     def _bayesian_plot(
-        self, round_to=None, **kwargs
+        self, round_to: int | None = None, **kwargs: dict
     ) -> tuple[plt.Figure, List[plt.Axes]]:
         """Generate plot for ANOVA-like experiments with non-equivalent group designs."""
         fig, ax = plt.subplots(
diff --git a/causalpy/experiments/regression_discontinuity.py b/causalpy/experiments/regression_discontinuity.py
index ec24ba0b..8f4d45bb 100644
--- a/causalpy/experiments/regression_discontinuity.py
+++ b/causalpy/experiments/regression_discontinuity.py
@@ -16,6 +16,8 @@
 """
 
 import warnings  # noqa: I001
+from typing import Union
+
 
 import numpy as np
 import pandas as pd
@@ -86,12 +88,12 @@ def __init__(
         data: pd.DataFrame,
         formula: str,
         treatment_threshold: float,
-        model=None,
+        model: Union[PyMCModel, RegressorMixin] | None = None,
         running_variable_name: str = "x",
         epsilon: float = 0.001,
         bandwidth: float = np.inf,
-        **kwargs,
-    ):
+        **kwargs: dict,
+    ) -> None:
         super().__init__(model=model)
         self.expt_type = "Regression Discontinuity"
         self.data = data
@@ -198,7 +200,7 @@ def __init__(
             ) - np.squeeze(self.pred_discon[0])
         # ******************************************************************************
 
-    def input_validation(self):
+    def input_validation(self) -> None:
         """Validate the input data and model formula for correctness"""
         if "treated" not in self.formula:
             raise FormulaException(
@@ -216,7 +218,7 @@ def input_validation(self):
             self.data = self.data.copy()
             self.data["treated"] = self.data["treated"].astype(bool)
 
-    def _is_treated(self, x):
+    def _is_treated(self, x: Union[np.ndarray, pd.Series]) -> np.ndarray:
         """Returns ``True`` if `x` is greater than or equal to the treatment threshold.
 
         .. warning::
@@ -225,7 +227,7 @@ def _is_treated(self, x):
         """
         return np.greater_equal(x, self.treatment_threshold)
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = None) -> None:
         """
         Print summary of main results and model coefficients
 
@@ -243,7 +245,9 @@ def summary(self, round_to=None) -> None:
         print("\n")
         self.print_coefficients(round_to)
 
-    def _bayesian_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
+    def _bayesian_plot(
+        self, round_to: int | None = 2, **kwargs: dict
+    ) -> tuple[plt.Figure, plt.Axes]:
         """Generate plot for regression discontinuity designs."""
         fig, ax = plt.subplots()
         # Plot raw data
@@ -292,7 +296,9 @@ def _bayesian_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]
         )
         return (fig, ax)
 
-    def _ols_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
+    def _ols_plot(
+        self, round_to: int | None = None, **kwargs: dict
+    ) -> tuple[plt.Figure, plt.Axes]:
         """Generate plot for regression discontinuity designs."""
         fig, ax = plt.subplots()
         # Plot raw data
@@ -312,7 +318,7 @@ def _ols_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
             label="model fit",
         )
         # create strings to compose title
-        r2 = f"$R^2$ on all data = {round_num(self.score, round_to)}"
+        r2 = f"$R^2$ on all data = {round_num(float(self.score), round_to)}"
         discon = f"Discontinuity at threshold = {round_num(self.discontinuity_at_threshold, round_to)}"
         ax.set(title=r2 + "\n" + discon)
         # Intervention line
diff --git a/causalpy/experiments/regression_kink.py b/causalpy/experiments/regression_kink.py
index 9e1f3aa5..62af07b6 100644
--- a/causalpy/experiments/regression_kink.py
+++ b/causalpy/experiments/regression_kink.py
@@ -17,6 +17,8 @@
 """
 
 import warnings  # noqa: I001
+from typing import Union
+
 
 from matplotlib import pyplot as plt
 import numpy as np
@@ -49,12 +51,12 @@ def __init__(
         data: pd.DataFrame,
         formula: str,
         kink_point: float,
-        model=None,
+        model: BaseExperiment | None = None,
         running_variable_name: str = "x",
         epsilon: float = 0.001,
         bandwidth: float = np.inf,
-        **kwargs,
-    ):
+        **kwargs: dict,
+    ) -> None:
         super().__init__(model=model)
         self.expt_type = "Regression Kink"
         self.data = data
@@ -130,7 +132,7 @@ def __init__(
             mu_kink_left, mu_kink, mu_kink_right, epsilon
         )
 
-    def input_validation(self):
+    def input_validation(self) -> None:
         """Validate the input data and model formula for correctness"""
         if "treated" not in self.formula:
             raise FormulaException(
@@ -149,7 +151,12 @@ def input_validation(self):
             raise ValueError("Epsilon must be greater than zero.")
 
     @staticmethod
-    def _eval_gradient_change(mu_kink_left, mu_kink, mu_kink_right, epsilon):
+    def _eval_gradient_change(
+        mu_kink_left: xr.DataArray,
+        mu_kink: xr.DataArray,
+        mu_kink_right: xr.DataArray,
+        epsilon: float,
+    ) -> xr.DataArray:
         """Evaluate the gradient change at the kink point.
         It works by evaluating the model below the kink point, at the kink point,
         and above the kink point.
@@ -160,7 +167,7 @@ def _eval_gradient_change(mu_kink_left, mu_kink, mu_kink_right, epsilon):
         gradient_change = gradient_right - gradient_left
         return gradient_change
 
-    def _probe_kink_point(self):
+    def _probe_kink_point(self) -> tuple[xr.DataArray, xr.DataArray, xr.DataArray]:
         """Probe the kink point to evaluate the predicted outcome at the kink point and
         either side."""
         # Create a dataframe to evaluate predicted outcome at the kink point and either
@@ -185,11 +192,11 @@ def _probe_kink_point(self):
         mu_kink_right = predicted["posterior_predictive"].sel(obs_ind=2)["mu"]
         return mu_kink_left, mu_kink, mu_kink_right
 
-    def _is_treated(self, x):
+    def _is_treated(self, x: Union[np.ndarray, pd.Series]) -> np.ndarray:
         """Returns ``True`` if `x` is greater than or equal to the treatment threshold."""  # noqa: E501
         return np.greater_equal(x, self.kink_point)
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = 2) -> None:
         """Print summary of main results and model coefficients.
 
         :param round_to:
@@ -203,12 +210,14 @@ def summary(self, round_to=None) -> None:
         Kink point on running variable: {self.kink_point}
 
         Results:
-        Change in slope at kink point = {round_num(self.gradient_change.mean(), round_to)}
+        Change in slope at kink point = {round_num(self.gradient_change.mean(), round_to if round_to is not None else 2)}
         """
         )
         self.print_coefficients(round_to)
 
-    def _bayesian_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]:
+    def _bayesian_plot(
+        self, round_to: int | None = 2, **kwargs: dict
+    ) -> tuple[plt.Figure, plt.Axes]:
         """Generate plot for regression kink designs."""
         fig, ax = plt.subplots()
         # Plot raw data
@@ -231,15 +240,15 @@ def _bayesian_plot(self, round_to=None, **kwargs) -> tuple[plt.Figure, plt.Axes]
         labels = ["Posterior mean"]
 
         # create strings to compose title
-        title_info = f"{round_num(self.score['unit_0_r2'], round_to)} (std = {round_num(self.score['unit_0_r2_std'], round_to)})"
+        title_info = f"{round_num(self.score['unit_0_r2'], round_to if round_to is not None else 2)} (std = {round_num(self.score['unit_0_r2_std'], round_to if round_to is not None else 2)})"
         r2 = f"Bayesian $R^2$ on all data = {title_info}"
         percentiles = self.gradient_change.quantile([0.03, 1 - 0.03]).values
         ci = (
             r"$CI_{94\%}$"
-            + f"[{round_num(percentiles[0], round_to)}, {round_num(percentiles[1], round_to)}]"
+            + f"[{round_num(percentiles[0], round_to if round_to is not None else 2)}, {round_num(percentiles[1], round_to if round_to is not None else 2)}]"
         )
         grad_change = f"""
-            Change in gradient = {round_num(self.gradient_change.mean(), round_to)},
+            Change in gradient = {round_num(self.gradient_change.mean(), round_to if round_to is not None else 2)},
             """
         ax.set(title=r2 + "\n" + grad_change + ci)
         # Intervention line
diff --git a/causalpy/experiments/synthetic_control.py b/causalpy/experiments/synthetic_control.py
index c1060638..3a1692e0 100644
--- a/causalpy/experiments/synthetic_control.py
+++ b/causalpy/experiments/synthetic_control.py
@@ -15,7 +15,7 @@
 Synthetic Control Experiment
 """
 
-from typing import List, Optional, Union
+from typing import List, Union
 
 import arviz as az
 import numpy as np
@@ -86,8 +86,8 @@ def __init__(
         treatment_time: Union[int, float, pd.Timestamp],
         control_units: list[str],
         treated_units: list[str],
-        model=None,
-        **kwargs,
+        model: Union[PyMCModel, RegressorMixin] | None = None,
+        **kwargs: dict,
     ) -> None:
         super().__init__(model=model)
         # rename the index to "obs_ind"
@@ -185,7 +185,9 @@ def __init__(
             self.post_impact
         )
 
-    def input_validation(self, data, treatment_time):
+    def input_validation(
+        self, data: pd.DataFrame, treatment_time: Union[int, float, pd.Timestamp]
+    ) -> None:
         """Validate the input data and model formula for correctness"""
         if isinstance(data.index, pd.DatetimeIndex) and not isinstance(
             treatment_time, pd.Timestamp
@@ -200,7 +202,7 @@ def input_validation(self, data, treatment_time):
                 "If data.index is not DatetimeIndex, treatment_time must be pd.Timestamp."  # noqa: E501
             )
 
-    def summary(self, round_to=None) -> None:
+    def summary(self, round_to: int | None = None) -> None:
         """Print summary of main results and model coefficients.
 
         :param round_to:
@@ -215,7 +217,10 @@ def summary(self, round_to=None) -> None:
         self.print_coefficients(round_to)
 
     def _bayesian_plot(
-        self, round_to=None, treated_unit: str | None = None, **kwargs
+        self,
+        round_to: int | None = None,
+        treated_unit: str | None = None,
+        **kwargs: dict,
     ) -> tuple[plt.Figure, List[plt.Axes]]:
         """
         Plot the results for a specific treated unit
@@ -366,7 +371,10 @@ def _bayesian_plot(
         return fig, ax
 
     def _ols_plot(
-        self, round_to=None, treated_unit: str | None = None, **kwargs
+        self,
+        round_to: int | None = None,
+        treated_unit: str | None = None,
+        **kwargs: dict,
     ) -> tuple[plt.Figure, List[plt.Axes]]:
         """
         Plot the results for OLS model for a specific treated unit
@@ -569,16 +577,20 @@ def get_plot_data_bayesian(
 
         return self.plot_data
 
-    def _get_score_title(
-        self, treated_unit: str, round_to: Optional[int] = None
-    ) -> str:
+    def _get_score_title(self, treated_unit: str, round_to: int | None = 2) -> str:
         """Generate appropriate score title for the specified treated unit"""
         if isinstance(self.model, PyMCModel):
             # Bayesian model - get unit-specific R² scores using unified format
             unit_index = self.treated_units.index(treated_unit)
-            r2_val = round_num(self.score[f"unit_{unit_index}_r2"], round_to)
-            r2_std_val = round_num(self.score[f"unit_{unit_index}_r2_std"], round_to)
+            r2_val = round_num(
+                self.score[f"unit_{unit_index}_r2"],
+                round_to if round_to is not None else 2,
+            )
+            r2_std_val = round_num(
+                self.score[f"unit_{unit_index}_r2_std"],
+                round_to if round_to is not None else 2,
+            )
             return f"Pre-intervention Bayesian $R^2$: {r2_val} (std = {r2_std_val})"
         else:
             # OLS model - simple float score
-            return f"$R^2$ on pre-intervention data = {round_num(self.score, round_to)}"
+            return f"$R^2$ on pre-intervention data = {round_num(float(self.score), round_to if round_to is not None else 2)}"
diff --git a/causalpy/plot_utils.py b/causalpy/plot_utils.py
index 6d134539..b1aba671 100644
--- a/causalpy/plot_utils.py
+++ b/causalpy/plot_utils.py
@@ -15,7 +15,7 @@
 Plotting utility functions.
 """
 
-from typing import Any, Dict, Optional, Tuple, Union
+from typing import Any, Dict, Tuple, Union
 
 import arviz as az
 import matplotlib.pyplot as plt
@@ -31,9 +31,9 @@ def plot_xY(
     x: Union[pd.DatetimeIndex, np.ndarray, pd.Index, pd.Series, ExtensionArray],
     Y: xr.DataArray,
     ax: plt.Axes,
-    plot_hdi_kwargs: Optional[Dict[str, Any]] = None,
+    plot_hdi_kwargs: Dict[str, Any] | None = None,
     hdi_prob: float = 0.94,
-    label: Union[str, None] = None,
+    label: str | None = None,
 ) -> Tuple[Line2D, PolyCollection]:
     """
     Utility function to plot HDI intervals.
diff --git a/causalpy/pymc_models.py b/causalpy/pymc_models.py
index fa8c4df9..b332014d 100644
--- a/causalpy/pymc_models.py
+++ b/causalpy/pymc_models.py
@@ -13,7 +13,7 @@
 #   limitations under the License.
 """Custom PyMC models for causal inference"""
 
-from typing import Any, Dict, Optional
+from typing import Any, Dict
 
 import arviz as az
 import numpy as np
@@ -169,9 +169,9 @@ def priors_from_data(self, X, y) -> Dict[str, Any]:
 
     def __init__(
         self,
-        sample_kwargs: Optional[Dict[str, Any]] = None,
+        sample_kwargs: Dict[str, Any] | None = None,
         priors: dict[str, Any] | None = None,
-    ):
+    ) -> None:
         """
         :param sample_kwargs: A dictionary of kwargs that get unpacked and passed to the
             :func:`pymc.sample` function. Defaults to an empty dictionary.
@@ -182,8 +182,9 @@ def __init__(
 
         self.priors = {**self.default_priors, **(priors or {})}
 
-    def build_model(self, X, y, coords) -> None:
-        """Build the model, must be implemented by subclass."""
+    def build_model(
+        self, X: xr.DataArray, y: xr.DataArray, coords: Dict[str, Any] | None
+    ) -> None:
         raise NotImplementedError(
             "This method must be implemented by a subclass"
         )  # pragma: no cover
@@ -220,7 +221,9 @@ def _data_setter(self, X: xr.DataArray) -> None:
                 coords={"obs_ind": obs_coords},
             )
 
-    def fit(self, X, y, coords: Optional[Dict[str, Any]] = None) -> None:
+    def fit(
+        self, X: xr.DataArray, y: xr.DataArray, coords: Dict[str, Any] | None = None
+    ) -> az.InferenceData:
         """Draw samples from posterior, prior predictive, and posterior predictive
         distributions, placing them in the model's idata attribute.
         """
@@ -246,7 +249,7 @@ def fit(self, X, y, coords: Optional[Dict[str, Any]] = None) -> None:
             )
         return self.idata
 
-    def predict(self, X: xr.DataArray):
+    def predict(self, X: xr.DataArray) -> az.InferenceData:
         """
         Predict data given input data `X`
 
@@ -347,10 +350,12 @@ def calculate_impact(
         impact = y_true - y_pred["posterior_predictive"]["mu"]
         return impact.transpose(..., "obs_ind")
 
-    def calculate_cumulative_impact(self, impact):
+    def calculate_cumulative_impact(self, impact: xr.DataArray) -> xr.DataArray:
         return impact.cumsum(dim="obs_ind")
 
-    def print_coefficients(self, labels, round_to=None) -> None:
+    def print_coefficients(
+        self, labels: list[str], round_to: int | None = None
+    ) -> None:
         if self.idata is None:
             raise RuntimeError("Model has not been fit")
 
@@ -451,13 +456,15 @@ class LinearRegression(PyMCModel):
         ),
     }
 
-    def build_model(self, X, y, coords):
+    def build_model(
+        self, X: xr.DataArray, y: xr.DataArray, coords: Dict[str, Any] | None
+    ) -> None:
         """
         Defines the PyMC model
         """
         with self:
             # Ensure treated_units coordinate exists for consistency
-            if "treated_units" not in coords:
+            if coords is not None and "treated_units" not in coords:
                 coords = coords.copy()
                 coords["treated_units"] = ["unit_0"]
 
@@ -548,7 +555,9 @@ def priors_from_data(self, X, y) -> Dict[str, Any]:
             ),
         }
 
-    def build_model(self, X, y, coords):
+    def build_model(
+        self, X: xr.DataArray, y: xr.DataArray, coords: Dict[str, Any] | None
+    ) -> None:
         """
         Defines the PyMC model
         """
@@ -609,7 +618,15 @@ class InstrumentalVariableRegression(PyMCModel):
     Inference data...
     """
 
-    def build_model(self, X, Z, y, t, coords, priors):
+    def build_model(  # type: ignore
+        self,
+        X: np.ndarray,
+        Z: np.ndarray,
+        y: np.ndarray,
+        t: np.ndarray,
+        coords: Dict[str, Any],
+        priors: Dict[str, Any],
+    ) -> None:
         """Specify model with treatment regression and focal regression data and priors
 
         :param X: A pandas dataframe used to predict our outcome y
@@ -666,7 +683,7 @@ def build_model(self, X, Z, y, t, coords, priors):
                 shape=(X.shape[0], 2),
             )
 
-    def sample_predictive_distribution(self, ppc_sampler="jax"):
+    def sample_predictive_distribution(self, ppc_sampler: str | None = "jax") -> None:
         """Function to sample the Multivariate Normal posterior predictive
         Likelihood term in the IV class. This can be slow without
         using the JAX sampler compilation method. If using the
@@ -676,25 +693,38 @@ def sample_predictive_distribution(self, ppc_sampler="jax"):
         random_seed = self.sample_kwargs.get("random_seed", None)
 
         if ppc_sampler == "jax":
-            with self:
-                self.idata.extend(
-                    pm.sample_posterior_predictive(
-                        self.idata,
-                        random_seed=random_seed,
-                        compile_kwargs={"mode": "JAX"},
+            if self.idata is not None:
+                with self:
+                    self.idata.extend(
+                        pm.sample_posterior_predictive(
+                            self.idata,
+                            random_seed=random_seed,
+                            compile_kwargs={"mode": "JAX"},
+                        )
                     )
-                )
         elif ppc_sampler == "pymc":
-            with self:
-                self.idata.extend(pm.sample_prior_predictive(random_seed=random_seed))
-                self.idata.extend(
-                    pm.sample_posterior_predictive(
-                        self.idata,
-                        random_seed=random_seed,
+            if self.idata is not None:
+                with self:
+                    self.idata.extend(
+                        pm.sample_prior_predictive(random_seed=random_seed)
+                    )
+                    self.idata.extend(
+                        pm.sample_posterior_predictive(
+                            self.idata,
+                            random_seed=random_seed,
+                        )
                     )
-                )
 
-    def fit(self, X, Z, y, t, coords, priors, ppc_sampler=None):
+    def fit(  # type: ignore
+        self,
+        X: np.ndarray,
+        Z: np.ndarray,
+        y: np.ndarray,
+        t: np.ndarray,
+        coords: Dict[str, Any],
+        priors: Dict[str, Any],
+        ppc_sampler: str | None = None,
+    ) -> az.InferenceData:
         """Draw samples from posterior distribution and potentially
         from the prior and posterior predictive distributions. The
         fit call can take values for the
@@ -754,7 +784,14 @@ class PropensityScore(PyMCModel):
         "b": Prior("Normal", mu=0, sigma=1, dims="coeffs"),
     }
 
-    def build_model(self, X, t, coords, prior=None, noncentred=True):
+    def build_model(  # type: ignore
+        self,
+        X: np.ndarray,
+        t: np.ndarray,
+        coords: Dict[str, Any],
+        prior: Dict[str, Any] | None = None,
+        noncentred: bool = True,
+    ) -> None:
         "Defines the PyMC propensity model"
         with self:
             self.add_coords(coords)
@@ -765,7 +802,14 @@ def build_model(self, X, t, coords, prior=None, noncentred=True):
             p = pm.Deterministic("p", pm.math.invlogit(mu))
             pm.Bernoulli("t_pred", p=p, observed=t_data, dims="obs_ind")
 
-    def fit(self, X, t, coords, prior={"b": [0, 1]}, noncentred=True):
+    def fit(  # type: ignore
+        self,
+        X: np.ndarray,
+        t: np.ndarray,
+        coords: Dict[str, Any],
+        prior: Dict[str, list] = {"b": [0, 1]},
+        noncentred: bool = True,
+    ) -> az.InferenceData:
         """Draw samples from posterior, prior predictive, and posterior predictive
         distributions. We overwrite the base method because the base method assumes
         a variable y and we use t to indicate the treatment variable here.
@@ -777,29 +821,30 @@ def fit(self, X, t, coords, prior={"b": [0, 1]}, noncentred=True):
         self.build_model(X, t, coords, prior, noncentred)
         with self:
             self.idata = pm.sample(**self.sample_kwargs)
-            self.idata.extend(pm.sample_prior_predictive(random_seed=random_seed))
-            self.idata.extend(
-                pm.sample_posterior_predictive(
-                    self.idata, progressbar=False, random_seed=random_seed
+            if self.idata is not None:
+                self.idata.extend(pm.sample_prior_predictive(random_seed=random_seed))
+                self.idata.extend(
+                    pm.sample_posterior_predictive(
+                        self.idata, progressbar=False, random_seed=random_seed
+                    )
                 )
-            )
         return self.idata
 
     def fit_outcome_model(
         self,
-        X_outcome,
-        y,
-        coords,
-        priors={
+        X_outcome: pd.DataFrame,
+        y: pd.Series,
+        coords: Dict[str, Any],
+        priors: Dict[str, Any] = {
             "b_outcome": [0, 1],
             "sigma": 1,
             "beta_ps": [0, 1],
         },
-        noncentred=True,
-        normal_outcome=True,
-        spline_component=False,
-        winsorize_boundary=0.0,
-    ):
+        noncentred: bool = True,
+        normal_outcome: bool = True,
+        spline_component: bool = False,
+        winsorize_boundary: float = 0.0,
+    ) -> tuple[az.InferenceData, pm.Model]:
         """
         Fit a Bayesian outcome model using covariates and previously estimated propensity scores.
 
diff --git a/causalpy/skl_models.py b/causalpy/skl_models.py
index 5aaca205..8383dc87 100644
--- a/causalpy/skl_models.py
+++ b/causalpy/skl_models.py
@@ -26,15 +26,19 @@
 class ScikitLearnAdaptor:
     """Base class for scikit-learn models that can be used for causal inference."""
 
-    def calculate_impact(self, y_true, y_pred):
+    coef_: np.ndarray
+
+    def calculate_impact(self, y_true: np.ndarray, y_pred: np.ndarray) -> np.ndarray:
         """Calculate the causal impact of the intervention."""
         return y_true - y_pred
 
-    def calculate_cumulative_impact(self, impact):
+    def calculate_cumulative_impact(self, impact: np.ndarray) -> np.ndarray:
         """Calculate the cumulative impact intervention."""
         return np.cumsum(impact)
 
-    def print_coefficients(self, labels, round_to=None) -> None:
+    def print_coefficients(
+        self, labels: list[str], round_to: int | None = None
+    ) -> None:
         """Print the coefficients of the model with the corresponding labels."""
         print("Model coefficients:")
         coef_ = self.get_coeffs()
@@ -45,10 +49,12 @@ def print_coefficients(self, labels, round_to=None) -> None:
             # Left-align the name
             formatted_name = f"{name:<{max_label_length}}"
             # Right-align the value with width 10
-            formatted_val = f"{round_num(val, round_to):>10}"
+            formatted_val = (
+                f"{round_num(val, round_to if round_to is not None else 2):>10}"
+            )
             print(f"  {formatted_name}\t{formatted_val}")
 
-    def get_coeffs(self):
+    def get_coeffs(self) -> np.ndarray:
         """Get the coefficients of the model as a numpy array."""
         return np.squeeze(self.coef_)
 
@@ -57,11 +63,11 @@ class WeightedProportion(ScikitLearnAdaptor, LinearModel, RegressorMixin):
     """Weighted proportion model for causal inference. Used for synthetic control
     methods for example"""
 
-    def loss(self, W, X, y):
+    def loss(self, W: np.ndarray, X: np.ndarray, y: np.ndarray) -> float:
         """Compute root mean squared loss with data X, weights W, and predictor y"""
         return np.sqrt(np.mean((y - np.dot(X, W.T)) ** 2))
 
-    def fit(self, X, y):
+    def fit(self, X: np.ndarray, y: np.ndarray) -> "WeightedProportion":
         """Fit model on data X with predictor y"""
         w_start = [1 / X.shape[1]] * X.shape[1]
         coef_ = fmin_slsqp(
@@ -75,7 +81,7 @@ def fit(self, X, y):
         self.mse = self.loss(W=self.coef_, X=X, y=y)
         return self
 
-    def predict(self, X):
+    def predict(self, X: np.ndarray) -> np.ndarray:
         """Predict results for data X"""
         return np.dot(X, self.coef_.T)
 
@@ -89,7 +95,9 @@ def create_causalpy_compatible_class(
     return estimator
 
 
-def _add_mixin_methods(model_instance, mixin_class):
+def _add_mixin_methods(
+    model_instance: RegressorMixin, mixin_class: type
+) -> RegressorMixin:
     """Utility function to bind mixin methods to an existing model instance."""
     for attr_name in dir(mixin_class):
         attr = getattr(mixin_class, attr_name)
diff --git a/causalpy/utils.py b/causalpy/utils.py
index 5b7c601b..997c93ba 100644
--- a/causalpy/utils.py
+++ b/causalpy/utils.py
@@ -34,7 +34,7 @@ def _series_has_2_levels(series: pd.Series) -> bool:
     return len(pd.Categorical(series).categories) == 2
 
 
-def round_num(n, round_to):
+def round_num(n: float, round_to: int | None) -> str:
     """
     Return a string representing a number with `round_to` significant figures.
 
@@ -42,14 +42,14 @@ def round_num(n, round_to):
     ----------
     n : float
         number to round
-    round_to : int
+    round_to : int, optional
         number of significant figures
     """
     sig_figs = _format_sig_figs(n, round_to)
     return f"{n:.{sig_figs}g}"
 
 
-def _format_sig_figs(value, default=None):
+def _format_sig_figs(value: float, default: int | None = None) -> int:
     """Get a default number of significant figures.
 
     Gives the integer part or `default`, whichever is bigger.
@@ -68,7 +68,7 @@ def _format_sig_figs(value, default=None):
     return max(int(np.log10(np.abs(value))) + 1, default)
 
 
-def convert_to_string(x: Union[float, xr.DataArray], round_to: int = 2) -> str:
+def convert_to_string(x: Union[float, xr.DataArray], round_to: int | None = 2) -> str:
     """Utility function which takes in numeric inputs and returns a string."""
     if isinstance(x, float):
         # In the case of a float, we return the number rounded to 2 decimal places
diff --git a/docs/source/_static/interrogate_badge.svg b/docs/source/_static/interrogate_badge.svg
index 26433625..aa85b1ad 100644
--- a/docs/source/_static/interrogate_badge.svg
+++ b/docs/source/_static/interrogate_badge.svg
@@ -1,5 +1,5 @@
 <svg width="140" height="20" viewBox="0 0 140 20" version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" xmlns:serif="http://www.serif.com/" style="fill-rule:evenodd;clip-rule:evenodd;stroke-linejoin:round;stroke-miterlimit:2;">
-    <title>interrogate: 95.9%</title>
+    <title>interrogate: 95.1%</title>
     <g transform="matrix(1,0,0,1,22,0)">
         <g id="backgrounds" transform="matrix(1.32789,0,0,1,-22.3892,0)">
             <rect x="0" y="0" width="71" height="20" style="fill:rgb(85,85,85);"/>
@@ -12,8 +12,8 @@
     <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110">
         <text x="590" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="610">interrogate</text>
         <text x="590" y="140" transform="scale(.1)" textLength="610">interrogate</text>
-        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.9%</text>
-        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.9%</text>
+        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
+        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
     </g>
     <g id="logo-shadow" serif:id="logo shadow" transform="matrix(0.854876,0,0,0.854876,-6.73514,1.732)">
         <g transform="matrix(0.299012,0,0,0.299012,9.70229,-6.68582)">

From b226a9dbcd5ecec265f7d6486e7bb7b754cd2da3 Mon Sep 17 00:00:00 2001
From: juanitorduz <juanitorduz@gmail.com>
Date: Wed, 12 Nov 2025 11:45:57 +0100
Subject: [PATCH 2/6] rm file

---
 docs/source/_static/interrogate_badge.svg | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/docs/source/_static/interrogate_badge.svg b/docs/source/_static/interrogate_badge.svg
index aa85b1ad..8734d55d 100644
--- a/docs/source/_static/interrogate_badge.svg
+++ b/docs/source/_static/interrogate_badge.svg
@@ -1,5 +1,5 @@
 <svg width="140" height="20" viewBox="0 0 140 20" version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" xmlns:serif="http://www.serif.com/" style="fill-rule:evenodd;clip-rule:evenodd;stroke-linejoin:round;stroke-miterlimit:2;">
-    <title>interrogate: 95.1%</title>
+    <title>interrogate: 95.8%</title>
     <g transform="matrix(1,0,0,1,22,0)">
         <g id="backgrounds" transform="matrix(1.32789,0,0,1,-22.3892,0)">
             <rect x="0" y="0" width="71" height="20" style="fill:rgb(85,85,85);"/>
@@ -12,8 +12,8 @@
     <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110">
         <text x="590" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="610">interrogate</text>
         <text x="590" y="140" transform="scale(.1)" textLength="610">interrogate</text>
-        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
-        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
+        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.8%</text>
+        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.8%</text>
     </g>
     <g id="logo-shadow" serif:id="logo shadow" transform="matrix(0.854876,0,0,0.854876,-6.73514,1.732)">
         <g transform="matrix(0.299012,0,0,0.299012,9.70229,-6.68582)">

From aa0ca3b714cc26c1ced813ba0eb670dc8cb655f4 Mon Sep 17 00:00:00 2001
From: juanitorduz <juanitorduz@gmail.com>
Date: Wed, 12 Nov 2025 11:51:17 +0100
Subject: [PATCH 3/6] update badge

---
 docs/source/_static/interrogate_badge.svg | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/docs/source/_static/interrogate_badge.svg b/docs/source/_static/interrogate_badge.svg
index 8734d55d..aa85b1ad 100644
--- a/docs/source/_static/interrogate_badge.svg
+++ b/docs/source/_static/interrogate_badge.svg
@@ -1,5 +1,5 @@
 <svg width="140" height="20" viewBox="0 0 140 20" version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" xmlns:serif="http://www.serif.com/" style="fill-rule:evenodd;clip-rule:evenodd;stroke-linejoin:round;stroke-miterlimit:2;">
-    <title>interrogate: 95.8%</title>
+    <title>interrogate: 95.1%</title>
     <g transform="matrix(1,0,0,1,22,0)">
         <g id="backgrounds" transform="matrix(1.32789,0,0,1,-22.3892,0)">
             <rect x="0" y="0" width="71" height="20" style="fill:rgb(85,85,85);"/>
@@ -12,8 +12,8 @@
     <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110">
         <text x="590" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="610">interrogate</text>
         <text x="590" y="140" transform="scale(.1)" textLength="610">interrogate</text>
-        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.8%</text>
-        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.8%</text>
+        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
+        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
     </g>
     <g id="logo-shadow" serif:id="logo shadow" transform="matrix(0.854876,0,0,0.854876,-6.73514,1.732)">
         <g transform="matrix(0.299012,0,0,0.299012,9.70229,-6.68582)">

From 1aaabf1eae8fa257c9fd414990c0bb0fa7df4d7a Mon Sep 17 00:00:00 2001
From: Juan Orduz <juanitorduz@gmail.com>
Date: Wed, 12 Nov 2025 11:53:34 +0100
Subject: [PATCH 4/6] Update causalpy/experiments/regression_kink.py

Co-authored-by: Copilot <175728472+Copilot@users.noreply.github.com>
---
 causalpy/experiments/regression_kink.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/causalpy/experiments/regression_kink.py b/causalpy/experiments/regression_kink.py
index 62af07b6..fe58e079 100644
--- a/causalpy/experiments/regression_kink.py
+++ b/causalpy/experiments/regression_kink.py
@@ -210,7 +210,7 @@ def summary(self, round_to: int | None = 2) -> None:
         Kink point on running variable: {self.kink_point}
 
         Results:
-        Change in slope at kink point = {round_num(self.gradient_change.mean(), round_to if round_to is not None else 2)}
+        Change in slope at kink point = {round_num(self.gradient_change.mean(), round_to)}
         """
         )
         self.print_coefficients(round_to)

From 82ed06dc90ed885e21c8d0b1b227e14b80eb7201 Mon Sep 17 00:00:00 2001
From: juanitorduz <juanitorduz@gmail.com>
Date: Wed, 12 Nov 2025 11:58:19 +0100
Subject: [PATCH 5/6] update docstrings

---
 causalpy/data/datasets.py                     |  17 ++-
 causalpy/experiments/base.py                  |   9 +-
 causalpy/experiments/diff_in_diff.py          |  32 +++---
 causalpy/experiments/instrumental_variable.py |  49 ++++----
 .../inverse_propensity_weighting.py           |  31 ++---
 causalpy/plot_utils.py                        |  56 +++++----
 causalpy/pymc_models.py                       | 108 ++++++++++++++----
 causalpy/skl_models.py                        |  11 +-
 causalpy/utils.py                             |  34 +++++-
 docs/source/_static/interrogate_badge.svg     |   6 +-
 10 files changed, 242 insertions(+), 111 deletions(-)

diff --git a/causalpy/data/datasets.py b/causalpy/data/datasets.py
index 9a463982..40085799 100644
--- a/causalpy/data/datasets.py
+++ b/causalpy/data/datasets.py
@@ -49,9 +49,22 @@ def _get_data_home() -> pathlib.Path:
 
 
 def load_data(dataset: str | None = None) -> pd.DataFrame:
-    """Loads the requested dataset and returns a pandas DataFrame.
+    """Load the requested dataset and return a pandas DataFrame.
 
-    :param dataset: The desired dataset to load
+    Parameters
+    ----------
+    dataset : str, optional
+        The desired dataset to load. If None, raises ValueError.
+
+    Returns
+    -------
+    pd.DataFrame
+        The loaded dataset as a pandas DataFrame.
+
+    Raises
+    ------
+    ValueError
+        If the requested dataset is not found.
     """
 
     if dataset in DATASETS:
diff --git a/causalpy/experiments/base.py b/causalpy/experiments/base.py
index 9f0b26ac..b3d3d80d 100644
--- a/causalpy/experiments/base.py
+++ b/causalpy/experiments/base.py
@@ -62,7 +62,14 @@ def idata(self) -> az.InferenceData:
         return self.model.idata
 
     def print_coefficients(self, round_to: int | None = None) -> None:
-        """Ask the model to print its coefficients."""
+        """Ask the model to print its coefficients.
+
+        Parameters
+        ----------
+        round_to : int, optional
+            Number of significant figures to round to. Defaults to None,
+            in which case 2 significant figures are used.
+        """
         self.model.print_coefficients(self.labels, round_to)
 
     def plot(self, *args: Any, **kwargs: Any) -> tuple:
diff --git a/causalpy/experiments/diff_in_diff.py b/causalpy/experiments/diff_in_diff.py
index f0dd87ad..02cb8e6c 100644
--- a/causalpy/experiments/diff_in_diff.py
+++ b/causalpy/experiments/diff_in_diff.py
@@ -49,20 +49,24 @@ class DifferenceInDifferences(BaseExperiment):
 
     .. note::
 
-        There is no pre/post intervention data distinction for DiD, we fit all the
-        data available.
-    :param data:
-        A pandas dataframe
-    :param formula:
-        A statistical model formula
-    :param time_variable_name:
-        Name of the data column for the time variable
-    :param group_variable_name:
-        Name of the data column for the group variable
-    :param post_treatment_variable_name:
-        Name of the data column indicating post-treatment period (default: "post_treatment")
-    :param model:
-        A PyMC model for difference in differences
+        There is no pre/post intervention data distinction for DiD, we fit
+        all the data available.
+
+    Parameters
+    ----------
+    data : pd.DataFrame
+        A pandas dataframe.
+    formula : str
+        A statistical model formula.
+    time_variable_name : str
+        Name of the data column for the time variable.
+    group_variable_name : str
+        Name of the data column for the group variable.
+    post_treatment_variable_name : str, optional
+        Name of the data column indicating post-treatment period.
+        Defaults to "post_treatment".
+    model : PyMCModel or RegressorMixin, optional
+        A PyMC model for difference in differences. Defaults to None.
 
     Example
     --------
diff --git a/causalpy/experiments/instrumental_variable.py b/causalpy/experiments/instrumental_variable.py
index b7cbd737..15427b40 100644
--- a/causalpy/experiments/instrumental_variable.py
+++ b/causalpy/experiments/instrumental_variable.py
@@ -27,31 +27,30 @@
 
 
 class InstrumentalVariable(BaseExperiment):
-    """
-    A class to analyse instrumental variable style experiments.
-
-    :param instruments_data: A pandas dataframe of instruments
-                             for our treatment variable. Should contain
-                             instruments Z, and treatment t
-    :param data: A pandas dataframe of covariates for fitting
-                 the focal regression of interest. Should contain covariates X
-                 including treatment t and outcome y
-    :param instruments_formula: A statistical model formula for
-                                the instrumental stage regression
-                                e.g. t ~ 1 + z1 + z2 + z3
-    :param formula: A statistical model formula for the \n
-                    focal regression e.g. y ~ 1 + t + x1 + x2 + x3
-    :param model: A PyMC model
-    :param priors: An optional dictionary of priors for the
-                   mus and sigmas of both regressions. If priors are not
-                   specified we will substitute MLE estimates for the beta
-                   coefficients. Greater control can be achieved
-                   by specifying the priors directly e.g. priors = {
-                                    "mus": [0, 0],
-                                    "sigmas": [1, 1],
-                                    "eta": 2,
-                                    "lkj_sd": 2,
-                                    }
+    """A class to analyse instrumental variable style experiments.
+
+    Parameters
+    ----------
+    instruments_data : pd.DataFrame
+        A pandas dataframe of instruments for our treatment variable.
+        Should contain instruments Z, and treatment t.
+    data : pd.DataFrame
+        A pandas dataframe of covariates for fitting the focal regression
+        of interest. Should contain covariates X including treatment t and
+        outcome y.
+    instruments_formula : str
+        A statistical model formula for the instrumental stage regression,
+        e.g. ``t ~ 1 + z1 + z2 + z3``.
+    formula : str
+        A statistical model formula for the focal regression,
+        e.g. ``y ~ 1 + t + x1 + x2 + x3``.
+    model : BaseExperiment, optional
+        A PyMC model. Defaults to None.
+    priors : dict, optional
+        Dictionary of priors for the mus and sigmas of both regressions.
+        If priors are not specified we will substitute MLE estimates for
+        the beta coefficients. Example: ``priors = {"mus": [0, 0],
+        "sigmas": [1, 1], "eta": 2, "lkj_sd": 2}``.
 
     Example
     --------
diff --git a/causalpy/experiments/inverse_propensity_weighting.py b/causalpy/experiments/inverse_propensity_weighting.py
index 99cbe7c0..92933203 100644
--- a/causalpy/experiments/inverse_propensity_weighting.py
+++ b/causalpy/experiments/inverse_propensity_weighting.py
@@ -31,22 +31,23 @@
 
 
 class InversePropensityWeighting(BaseExperiment):
-    """
-    A class to analyse inverse propensity weighting experiments.
+    """A class to analyse inverse propensity weighting experiments.
 
-    :param data:
-        A pandas dataframe
-    :param formula:
-        A statistical model formula for the propensity model
-    :param outcome_variable
-        A string denoting the outcome variable in datq to be reweighted
-    :param weighting_scheme:
-        A string denoting which weighting scheme to use among: 'raw', 'robust',
-        'doubly robust' or 'overlap'. See Aronow and Miller "Foundations
-        of Agnostic Statistics" for discussion and computation of these
-        weighting schemes.
-    :param model:
-        A PyMC model
+    Parameters
+    ----------
+    data : pd.DataFrame
+        A pandas dataframe.
+    formula : str
+        A statistical model formula for the propensity model.
+    outcome_variable : str
+        A string denoting the outcome variable in data to be reweighted.
+    weighting_scheme : str
+        A string denoting which weighting scheme to use among: 'raw',
+        'robust', 'doubly robust' or 'overlap'. See Aronow and Miller
+        "Foundations of Agnostic Statistics" for discussion and computation
+        of these weighting schemes.
+    model : BaseExperiment, optional
+        A PyMC model. Defaults to None.
 
     Example
     --------
diff --git a/causalpy/plot_utils.py b/causalpy/plot_utils.py
index b1aba671..2a65d62a 100644
--- a/causalpy/plot_utils.py
+++ b/causalpy/plot_utils.py
@@ -35,21 +35,28 @@ def plot_xY(
     hdi_prob: float = 0.94,
     label: str | None = None,
 ) -> Tuple[Line2D, PolyCollection]:
-    """
-    Utility function to plot HDI intervals.
-
-    :param x:
-        Pandas datetime index or numpy array of x-axis values
-    :param y:
-        Xarray data array of y-axis data
-    :param ax:
-        Matplotlib ax object
-    :param plot_hdi_kwargs:
-        Dictionary of keyword arguments passed to ax.plot()
-    :param hdi_prob:
-        The size of the HDI, default is 0.94
-    :param label:
-        The plot label
+    """Plot HDI intervals.
+
+    Parameters
+    ----------
+    x : pd.DatetimeIndex, np.ndarray, pd.Index, pd.Series, or ExtensionArray
+        Pandas datetime index or numpy array of x-axis values.
+    Y : xr.DataArray
+        Xarray data array of y-axis data.
+    ax : plt.Axes
+        Matplotlib axes object.
+    plot_hdi_kwargs : dict, optional
+        Dictionary of keyword arguments passed to ax.plot().
+    hdi_prob : float, optional
+        The size of the HDI. Default is 0.94.
+    label : str, optional
+        The plot label.
+
+    Returns
+    -------
+    tuple
+        Tuple of (Line2D, PolyCollection) handles for the plot line and
+        HDI patch.
     """
 
     if plot_hdi_kwargs is None:
@@ -86,13 +93,20 @@ def get_hdi_to_df(
     x: xr.DataArray,
     hdi_prob: float = 0.94,
 ) -> pd.DataFrame:
-    """
-    Utility function to calculate and recover HDI intervals.
+    """Calculate and recover HDI intervals.
+
+    Parameters
+    ----------
+    x : xr.DataArray
+        Xarray data array.
+    hdi_prob : float, optional
+        The size of the HDI. Default is 0.94.
 
-    :param x:
-        Xarray data array
-    :param hdi_prob:
-        The size of the HDI, default is 0.94
+    Returns
+    -------
+    pd.DataFrame
+        DataFrame containing the HDI intervals with 'lower' and 'higher'
+        columns.
     """
     hdi_result = az.hdi(x, hdi_prob=hdi_prob)
 
diff --git a/causalpy/pymc_models.py b/causalpy/pymc_models.py
index b332014d..e4f82624 100644
--- a/causalpy/pymc_models.py
+++ b/causalpy/pymc_models.py
@@ -173,8 +173,15 @@ def __init__(
         priors: dict[str, Any] | None = None,
     ) -> None:
         """
-        :param sample_kwargs: A dictionary of kwargs that get unpacked and passed to the
-            :func:`pymc.sample` function. Defaults to an empty dictionary.
+        Parameters
+        ----------
+        sample_kwargs : dict, optional
+            Dictionary of kwargs that get unpacked and passed to the
+            :func:`pymc.sample` function. Defaults to an empty dictionary
+            if None.
+        priors : dict, optional
+            Dictionary of priors for the model. Defaults to None, in which
+            case default priors are used.
         """
         super().__init__()
         self.idata = None
@@ -224,8 +231,23 @@ def _data_setter(self, X: xr.DataArray) -> None:
     def fit(
         self, X: xr.DataArray, y: xr.DataArray, coords: Dict[str, Any] | None = None
     ) -> az.InferenceData:
-        """Draw samples from posterior, prior predictive, and posterior predictive
-        distributions, placing them in the model's idata attribute.
+        """Draw samples from posterior, prior predictive, and posterior
+        predictive distributions.
+
+        Parameters
+        ----------
+        X : xr.DataArray
+            Input features as an xarray DataArray.
+        y : xr.DataArray
+            Target variable as an xarray DataArray.
+        coords : dict, optional
+            Dictionary with coordinate names for named dimensions.
+            Defaults to None.
+
+        Returns
+        -------
+        az.InferenceData
+            InferenceData object containing the samples.
         """
 
         # Ensure random_seed is used in sample_prior_predictive() and
@@ -356,6 +378,16 @@ def calculate_cumulative_impact(self, impact: xr.DataArray) -> xr.DataArray:
     def print_coefficients(
         self, labels: list[str], round_to: int | None = None
     ) -> None:
+        """Print the model coefficients with their labels.
+
+        Parameters
+        ----------
+        labels : list of str
+            List of strings representing the coefficient names.
+        round_to : int, optional
+            Number of significant figures to round to. Defaults to None,
+            in which case 2 significant figures are used.
+        """
         if self.idata is None:
             raise RuntimeError("Model has not been fit")
 
@@ -627,19 +659,27 @@ def build_model(  # type: ignore
         coords: Dict[str, Any],
         priors: Dict[str, Any],
     ) -> None:
-        """Specify model with treatment regression and focal regression data and priors
-
-        :param X: A pandas dataframe used to predict our outcome y
-        :param Z: A pandas dataframe used to predict our treatment variable t
-        :param y: An array of values representing our focal outcome y
-        :param t: An array of values representing the treatment t of
-                  which we're interested in estimating the causal impact
-        :param coords: A dictionary with the coordinate names for our
-                       instruments and covariates
-        :param priors: An optional dictionary of priors for the mus and
-                      sigmas of both regressions
-                      :code:`priors = {"mus": [0, 0], "sigmas": [1, 1],
-                      "eta": 2, "lkj_sd": 2}`
+        """Specify model with treatment regression and focal regression
+        data and priors.
+
+        Parameters
+        ----------
+        X : np.ndarray
+            Array used to predict our outcome y.
+        Z : np.ndarray
+            Array used to predict our treatment variable t.
+        y : np.ndarray
+            Array of values representing our focal outcome y.
+        t : np.ndarray
+            Array representing the treatment t of which we're interested
+            in estimating the causal impact.
+        coords : dict
+            Dictionary with the coordinate names for our instruments and
+            covariates.
+        priors : dict
+            Dictionary of priors for the mus and sigmas of both
+            regressions. Example: ``priors = {"mus": [0, 0],
+            "sigmas": [1, 1], "eta": 2, "lkj_sd": 2}``.
         """
 
         # --- Priors ---
@@ -725,13 +765,33 @@ def fit(  # type: ignore
         priors: Dict[str, Any],
         ppc_sampler: str | None = None,
     ) -> az.InferenceData:
-        """Draw samples from posterior distribution and potentially
-        from the prior and posterior predictive distributions. The
-        fit call can take values for the
-        ppc_sampler = ['jax', 'pymc', None]
-        We default to None, so the user can determine if they wish
-        to spend time sampling the posterior predictive distribution
-        independently.
+        """Draw samples from posterior distribution and potentially from
+        the prior and posterior predictive distributions.
+
+        Parameters
+        ----------
+        X : np.ndarray
+            Array used to predict our outcome y.
+        Z : np.ndarray
+            Array used to predict our treatment variable t.
+        y : np.ndarray
+            Array of values representing our focal outcome y.
+        t : np.ndarray
+            Array representing the treatment variable.
+        coords : dict
+            Dictionary with coordinate names for named dimensions.
+        priors : dict
+            Dictionary of priors for the model.
+        ppc_sampler : str, optional
+            Sampler for posterior predictive distribution. Can be 'jax',
+            'pymc', or None. Defaults to None, so the user can determine
+            if they wish to spend time sampling the posterior predictive
+            distribution independently.
+
+        Returns
+        -------
+        az.InferenceData
+            InferenceData object containing the samples.
         """
 
         # Ensure random_seed is used in sample_prior_predictive() and
diff --git a/causalpy/skl_models.py b/causalpy/skl_models.py
index 8383dc87..5100ec02 100644
--- a/causalpy/skl_models.py
+++ b/causalpy/skl_models.py
@@ -39,7 +39,16 @@ def calculate_cumulative_impact(self, impact: np.ndarray) -> np.ndarray:
     def print_coefficients(
         self, labels: list[str], round_to: int | None = None
     ) -> None:
-        """Print the coefficients of the model with the corresponding labels."""
+        """Print the coefficients of the model with the corresponding labels.
+
+        Parameters
+        ----------
+        labels : list of str
+            List of strings representing the coefficient names.
+        round_to : int, optional
+            Number of significant figures to round to. Defaults to None,
+            in which case 2 significant figures are used.
+        """
         print("Model coefficients:")
         coef_ = self.get_coeffs()
         # Determine the width of the longest label
diff --git a/causalpy/utils.py b/causalpy/utils.py
index 997c93ba..4d1a60c8 100644
--- a/causalpy/utils.py
+++ b/causalpy/utils.py
@@ -35,15 +35,20 @@ def _series_has_2_levels(series: pd.Series) -> bool:
 
 
 def round_num(n: float, round_to: int | None) -> str:
-    """
-    Return a string representing a number with `round_to` significant figures.
+    """Return a string representing a number with significant figures.
 
     Parameters
     ----------
     n : float
-        number to round
+        Number to round.
     round_to : int, optional
-        number of significant figures
+        Number of significant figures. If None, defaults to 2.
+
+    Returns
+    -------
+    str
+        String representation of the number with specified significant
+        figures.
     """
     sig_figs = _format_sig_figs(n, round_to)
     return f"{n:.{sig_figs}g}"
@@ -69,7 +74,26 @@ def _format_sig_figs(value: float, default: int | None = None) -> int:
 
 
 def convert_to_string(x: Union[float, xr.DataArray], round_to: int | None = 2) -> str:
-    """Utility function which takes in numeric inputs and returns a string."""
+    """Convert numeric inputs to a formatted string representation.
+
+    Parameters
+    ----------
+    x : float or xr.DataArray
+        The numeric value or xarray DataArray to convert.
+    round_to : int, optional
+        Number of significant figures to round to. Defaults to 2.
+
+    Returns
+    -------
+    str
+        Formatted string representation. For floats, returns rounded
+        decimal. For DataArrays, returns mean with 94% credible interval.
+
+    Raises
+    ------
+    ValueError
+        If `x` is neither a float nor an xarray DataArray.
+    """
     if isinstance(x, float):
         # In the case of a float, we return the number rounded to 2 decimal places
         return f"{x:.2f}"
diff --git a/docs/source/_static/interrogate_badge.svg b/docs/source/_static/interrogate_badge.svg
index aa85b1ad..4704ef6c 100644
--- a/docs/source/_static/interrogate_badge.svg
+++ b/docs/source/_static/interrogate_badge.svg
@@ -1,5 +1,5 @@
 <svg width="140" height="20" viewBox="0 0 140 20" version="1.1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" xmlns:serif="http://www.serif.com/" style="fill-rule:evenodd;clip-rule:evenodd;stroke-linejoin:round;stroke-miterlimit:2;">
-    <title>interrogate: 95.1%</title>
+    <title>interrogate: 95.5%</title>
     <g transform="matrix(1,0,0,1,22,0)">
         <g id="backgrounds" transform="matrix(1.32789,0,0,1,-22.3892,0)">
             <rect x="0" y="0" width="71" height="20" style="fill:rgb(85,85,85);"/>
@@ -12,8 +12,8 @@
     <g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110">
         <text x="590" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="610">interrogate</text>
         <text x="590" y="140" transform="scale(.1)" textLength="610">interrogate</text>
-        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
-        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.1%</text>
+        <text x="1160" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="370" data-interrogate="result">95.5%</text>
+        <text x="1160" y="140" transform="scale(.1)" textLength="370" data-interrogate="result">95.5%</text>
     </g>
     <g id="logo-shadow" serif:id="logo shadow" transform="matrix(0.854876,0,0,0.854876,-6.73514,1.732)">
         <g transform="matrix(0.299012,0,0,0.299012,9.70229,-6.68582)">

From 92c791e511d9c410d47fad362bb1367a54d1f7a1 Mon Sep 17 00:00:00 2001
From: juanitorduz <juanitorduz@gmail.com>
Date: Wed, 12 Nov 2025 12:31:15 +0100
Subject: [PATCH 6/6] fix: apply ruff formatting after rebase

---
 causalpy/data/simulate_data.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/causalpy/data/simulate_data.py b/causalpy/data/simulate_data.py
index ae705059..de253420 100644
--- a/causalpy/data/simulate_data.py
+++ b/causalpy/data/simulate_data.py
@@ -15,8 +15,6 @@
 Functions that generate data sets used in examples
 """
 
-from typing import Any
-
 import numpy as np
 import pandas as pd
 from scipy.stats import dirichlet, gamma, norm, uniform