david26694 · LGonzalezGomez · Dec 17, 2024 · Dec 15, 2024 · Dec 15, 2024 · Dec 15, 2024
diff --git a/README.md b/README.md
@@ -263,6 +263,7 @@ The library offers the following classes:
     * `PairedTTestClusteredAnalysis`: to run a paired t-test on aggregated data for clusters
     * `ClusteredOLSAnalysis`: to run OLS analysis on the results of a clustered design
     * `OLSAnalysis`: to run OLS analysis for non-clustered data
+    * `DeltaMethodAnalysis`: to run Delta Method Analysis for clustered designs
     * `TargetAggregation`: to add pre-experimental data of the outcome to reduce variance
     * `SyntheticControlAnalysis`: to run synthetic control analysis
 * Regarding experiment analysis workflow:

diff --git a/cluster_experiments/__init__.py b/cluster_experiments/__init__.py
@@ -1,6 +1,7 @@
 from cluster_experiments.cupac import EmptyRegressor, TargetAggregation
 from cluster_experiments.experiment_analysis import (
     ClusteredOLSAnalysis,
+    DeltaMethodAnalysis,
     ExperimentAnalysis,
     GeeExperimentAnalysis,
     MLMExperimentAnalysis,
@@ -45,6 +46,7 @@
 __all__ = [
     "ExperimentAnalysis",
     "GeeExperimentAnalysis",
+    "DeltaMethodAnalysis",
     "OLSAnalysis",
     "BinaryPerturbator",
     "Perturbator",

diff --git a/cluster_experiments/experiment_analysis.py b/cluster_experiments/experiment_analysis.py
@@ -1,4 +1,5 @@
 import logging
+import warnings
 from abc import ABC, abstractmethod
 from dataclasses import dataclass
 from typing import Dict, List, Optional
@@ -7,10 +8,10 @@
 import pandas as pd
 import statsmodels.api as sm
 from pandas.api.types import is_numeric_dtype
-from scipy.stats import ttest_ind, ttest_rel
+from scipy.stats import norm, ttest_ind, ttest_rel
 
 from cluster_experiments.synthetic_control_utils import get_w
-from cluster_experiments.utils import HypothesisEntries
+from cluster_experiments.utils import HypothesisEntries, ModelResults
 
 
 @dataclass
@@ -1147,7 +1148,8 @@ def pvalue_based_on_hypothesis(
 
     def _get_treatment_cluster(self, df: pd.DataFrame) -> str:
         """Returns the first treatment cluster. The current implementation of Synthetic Control only accepts one treatment cluster.
-        This will be left inside Synthetic class because it doesn't apply for other analyses"""
+        This will be left inside Synthetic class because it doesn't apply for other analyses
+        """
         treatment_df = df[df[self.treatment_col] == 1]
         treatment_cluster = self._get_cluster_column(treatment_df).unique()[0]
         return treatment_cluster
@@ -1204,3 +1206,184 @@ def _split_pre_experiment_df(self, df: pd.DataFrame):
         pre_experiment_df = df[(df[self.time_col] <= self.intervention_date)]
         df = df[(df[self.time_col] > self.intervention_date)]
         return df, pre_experiment_df
+
+
+class DeltaMethodAnalysis(ExperimentAnalysis):
+    def __init__(
+        self,
+        cluster_cols: Optional[List[str]] = None,
+        target_col: str = "target",
+        scale_col: str = "scale",
+        treatment_col: str = "treatment",
+        treatment: str = "B",
+        covariates: Optional[List[str]] = None,
+        hypothesis: str = "two-sided",
+    ):
+        """
+        Class to run the Delta Method approximation for estimating the treatment effect on a ratio metric (target/scale) under a clustered design.
+        The analysis is done on the aggregated data at the cluster level, making computation more efficient.
+
+        Arguments:
+            cluster_cols: list of columns to use as clusters. Not available for the CUPED method.
+            target_col: name of the column containing the variable to measure (the numerator of the ratio).
+            scale_col: name of the column containing the scale variable (the denominator of the ratio).
+            treatment_col: name of the column containing the treatment variable.
+            treatment: name of the treatment to use as the treated group.
+            covariates: list of columns to use as covariates.
+            ratio_covariates: list of tuples of columns to use as covariates for ratio metrics. First element is the numerator column, second element is the denominator column.
+            hypothesis: one of "two-sided", "less", "greater" indicating the alternative hypothesis.
+
+            Usage:
+            ```python
+            import pandas as pd
+
+            from cluster_experiments.experiment_analysis import DeltaMethodAnalysis
+
+            df = pd.DataFrame({
+                'x': [1, 2, 3, 0, 0, 1] * 2,
+                'y': [2, 2, 5, 1, 1, 1] * 2,
+                'treatment': ["A"] * 6 + ["B"] * 6,
+                'cluster': [1, 2, 3, 1, 2, 3] * 2,
+            })
+
+            DeltaMethodAnalysis(
+                cluster_cols=['cluster'],
+                target_col='x',
+                scale_col='y'
+            ).get_pvalue(df)
+            ```
+        """
+
+        super().__init__(
+            target_col=target_col,
+            treatment_col=treatment_col,
+            cluster_cols=cluster_cols,
+            treatment=treatment,
+            covariates=covariates,
+            hypothesis=hypothesis,
+        )
+        self.scale_col = scale_col
+        self.cluster_cols = cluster_cols or []
+
+        if covariates is not None:
+            warnings.warn(
+                "Covariates are not supported in the Delta Method approximation for the time being. They will be ignored."
+            )
+        if cluster_cols is None:
+            raise ValueError(
+                "cluster_cols must be provided for the Delta Method analysis"
+            )
+
+    def _aggregate_to_cluster(self, df: pd.DataFrame) -> pd.DataFrame:
+        """
+        Returns an aggreegated dataframe of the target and scale variables at the cluster (and treatment) level.
+
+        Arguments:
+            df: dataframe containing the data to analyze
+        """
+        group_cols = self.cluster_cols + [self.treatment_col]
+        aggregate_df = df.groupby(by=group_cols, as_index=False).agg(
+            {self.target_col: "sum", self.scale_col: "sum"}
+        )
+        return aggregate_df
+
+    def _get_group_mean_and_variance(self, df: pd.DataFrame) -> tuple[float, float]:
+        """
+        Returns the mean and variance of the ratio metric (target/scale) as estimated by the delta method for a given group (treatment).
+
+        Arguments:
+            df: dataframe containing the data to analyze.
+        """
+        df = self._aggregate_to_cluster(df)
+        group_size = len(df)
+
+        if group_size < 1000:
+            self.__warn_small_group_size()
+
+        target_mean, scale_mean = df.loc[:, [self.target_col, self.scale_col]].mean()
+        target_variance, scale_variance = df.loc[
+            :, [self.target_col, self.scale_col]
+        ].var()
+        target_sum, scale_sum = df.loc[:, [self.target_col, self.scale_col]].sum()
+
+        target_scale_cov = df.loc[:, self.target_col].cov(df.loc[:, self.scale_col])
+
+        group_mean = target_sum / scale_sum
+        group_variance = (
+            (1 / (scale_mean**2)) * target_variance
+            + (target_mean**2) / (scale_mean**4) * scale_variance
+            - (2 * target_mean) / (scale_mean**3) * target_scale_cov
+        ) / group_size
+        return group_mean, group_variance
+
+    def _get_mean_standard_error(self, df: pd.DataFrame) -> tuple[float, float]:
+        """
+        Returns mean and variance of the ratio metric (target/scale) for a given cluster (i.e. user) computed using the Delta Method.
+        Variance reduction is used if covariates are given.
+        """
+
+        is_treatment = df[self.treatment_col] == 1
+        treat_mean, treat_var = self._get_group_mean_and_variance(df[is_treatment])
+        ctrl_mean, ctrl_var = self._get_group_mean_and_variance(df[~is_treatment])
+
+        mean_diff = treat_mean - ctrl_mean
+        standard_error = np.sqrt(treat_var + ctrl_var)
+
+        return mean_diff, standard_error
+
+    def analysis_pvalue(self, df: pd.DataFrame) -> float:
+        """
+        Returns the p-value of the analysis.
+
+        Arguments:
+            df: dataframe containing the data to analyze.
+        """
+
+        mean_diff, standard_error = self._get_mean_standard_error(df)
+
+        z_score = mean_diff / standard_error
+        p_value = 2 * (1 - norm.cdf(abs(z_score)))
+
+        results_delta = ModelResults(
+            params={self.treatment_col: mean_diff},
+            pvalues={self.treatment_col: p_value},
+        )
+
+        p_value = self.pvalue_based_on_hypothesis(results_delta)
+
+        return p_value
+
+    def analysis_point_estimate(self, df: pd.DataFrame) -> float:
+        """Returns the point estimate of the analysis
+        Arguments:
+            df: dataframe containing the data to analyze
+            verbose (Optional): bool, prints the regression summary if True
+        """
+        mean_diff, _standard_error = self._get_mean_standard_error(df)
+        return mean_diff
+
+    def analysis_standard_error(self, df: pd.DataFrame) -> float:
+        """Returns the standard error of the analysis
+        Arguments:
+            df: dataframe containing the data to analyze
+            verbose (Optional): bool, prints the regression summary if True
+        """
+        _mean_diff, standard_error = self._get_mean_standard_error(df)
+        return standard_error
+
+    @classmethod
+    def from_config(cls, config):
+        """Creates a DeltaMethodAnalysis object from a PowerConfig object"""
+        return cls(
+            cluster_cols=config.cluster_cols,
+            target_col=config.target_col,
+            scale_col=config.scale_col,
+            treatment_col=config.treatment_col,
+            treatment=config.treatment,
+            hypothesis=config.hypothesis,
+        )
+
+    def __warn_small_group_size(self):
+        warnings.warn(
+            "Delta Method approximation may not be accurate for small group sizes"
+        )
diff --git a/cluster_experiments/power_config.py b/cluster_experiments/power_config.py
@@ -6,6 +6,7 @@
 from cluster_experiments.cupac import EmptyRegressor, TargetAggregation
 from cluster_experiments.experiment_analysis import (
     ClusteredOLSAnalysis,
+    DeltaMethodAnalysis,
     GeeExperimentAnalysis,
     MLMExperimentAnalysis,
     OLSAnalysis,
@@ -38,6 +39,10 @@ class MissingArgumentError(ValueError):
     pass
 
 
+class UnexpectedArgumentError(ValueError):
+    pass
+
+
 @dataclass(eq=True)
 class PowerConfig:
     """
@@ -105,6 +110,7 @@ class PowerConfig:
 
     # optional mappings
     cupac_model: str = ""
+    scale_col: Optional[str] = None
 
     # Shared
     target_col: str = "target"
@@ -196,6 +202,10 @@ def __post_init__(self):
         if "segmented" in self.perturbator:
             self._raise_error_if_missing("segment_cols", "perturbator")
 
+        if "delta" not in self.analysis:
+            if self.scale_col is not None:
+                self._raise_error_if_missing("scale_col", "analysis")
+
     def _are_different(self, arg1, arg2) -> bool:
         return arg1 != arg2
 
@@ -214,6 +224,13 @@ def _raise_error_if_missing(self, attr, other_attr):
                 f"{other_attr} = {getattr(self, other_attr)}."
             )
 
+    def _raise_error_if_present(self, attr, other_attr):
+        if getattr(self, attr) is None:
+            raise UnexpectedArgumentError(
+                f"{attr} is not expected when using "
+                f"{other_attr} = {getattr(self, other_attr)}."
+            )
+
 
 perturbator_mapping = {
     "binary": BinaryPerturbator,
@@ -254,6 +271,7 @@ def _raise_error_if_missing(self, attr, other_attr):
     "ttest_clustered": TTestClusteredAnalysis,
     "paired_ttest_clustered": PairedTTestClusteredAnalysis,
     "mlm": MLMExperimentAnalysis,
+    "delta": DeltaMethodAnalysis,
 }
 
 cupac_model_mapping = {"": EmptyRegressor, "mean_cupac_model": TargetAggregation}
diff --git a/cluster_experiments/utils.py b/cluster_experiments/utils.py
@@ -1,4 +1,5 @@
 from enum import Enum
+from typing import Dict
 
 
 def _original_time_column(time_col: str) -> str:
@@ -26,3 +27,9 @@ class HypothesisEntries(Enum):
     TWO_SIDED = "two-sided"
     LESS = "less"
     GREATER = "greater"
+
+
+class ModelResults:
+    def __init__(self, params: Dict, pvalues: Dict):
+        self.params = params
+        self.pvalues = pvalues