Fix TripleDiff TSL double-weighting, rewrite CS reg covariate survey IF

igerber · claude · igerber · commit 6165bc4d24df · 2026-03-23T07:26:28.000-04:00
- TripleDifference: divide out survey weights from IF before passing to
  compute_survey_vcov, since Riesz representers already incorporate weights
  and TSL would multiply by weights again
- CallawaySantAnna _outcome_regression: rewrite survey covariate IF to follow
  DRDID panel OR structure — all terms consistently scaled by 1/sw_t_sum,
  nuisance correction divided by sw_t_sum for correct normalization

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
diff --git a/diff_diff/staggered.py b/diff_diff/staggered.py
@@ -1603,43 +1603,48 @@ def _outcome_regression(
             treated_residuals = treated_change - predicted_control
 
             if sw_treated is not None:
-                sw_t_norm = sw_treated / np.sum(sw_treated)
-                sw_c_norm = sw_control / np.sum(sw_control)
+                sw_t_sum = float(np.sum(sw_treated))
+                sw_t_norm = sw_treated / sw_t_sum
                 att = float(np.sum(sw_t_norm * treated_residuals))
 
-                # --- Regression nuisance IF correction ---
-                # Account for uncertainty in beta estimation
+                # --- DRDID panel OR influence function (survey-weighted) ---
+                # Following Sant'Anna & Zhao (2020) Theorem 3.1 for the OR estimator.
+                # All IF terms are scaled by 1/sw_t_sum so that sum(IF^2) gives V(ATT).
                 X_c = np.column_stack([np.ones(n_c), X_control])
                 X_t = np.column_stack([np.ones(n_t), X_treated])
 
-                # Weighted bread: (X'WX)^{-1}
+                # Treated component: w_i * (ΔY_i - m(X_i) - ATT) / sum(w_treated)
+                inf_treated = (sw_treated / sw_t_sum) * (treated_residuals - att)
+
+                # Control outcome-regression component
+                predicted_c = np.dot(X_c, beta)
+                inf_control_or = -(sw_control / sw_t_sum) * (control_change - predicted_c)
+
+                # Regression nuisance IF correction (accounts for beta estimation)
+                # Hessian of WLS: H = X_c' W_c X_c
                 XWX = X_c.T @ (X_c * sw_control[:, None])
                 try:
                     XWX_inv = np.linalg.solve(XWX, np.eye(XWX.shape[0]))
                 except np.linalg.LinAlgError:
                     XWX_inv = np.linalg.lstsq(XWX, np.eye(XWX.shape[0]), rcond=None)[0]
 
-                # Per-control regression score: w_i * x_i * resid_i
-                resid_c = control_change - X_c @ beta
+                # Per-control score: w_i * x_i * (y_i - x_i'beta)
+                resid_c = control_change - predicted_c
                 score_c = X_c * (sw_control * resid_c)[:, None]
-                asy_lin_rep_reg = score_c @ XWX_inv  # shape (n_c, p)
+                asy_lin_rep_reg = score_c @ XWX_inv  # (n_c, p)
 
-                # Weighted treated covariate mean
-                X_treated_mean_w = np.average(X_t, axis=0, weights=sw_treated)
+                # Projection direction: survey-weighted treated covariate mean
+                X_treated_mean_w = np.sum(X_t * sw_treated[:, None], axis=0) / sw_t_sum
 
-                # Regression IF correction for control observations
-                inf_control_reg_corr = asy_lin_rep_reg @ X_treated_mean_w
+                # Correction: how beta uncertainty affects ATT
+                inf_control_reg_corr = (asy_lin_rep_reg @ X_treated_mean_w) / sw_t_sum
 
-                # Influence function (survey-weighted)
-                inf_treated = sw_t_norm * (treated_residuals - att)
-                inf_control = (
-                    -sw_c_norm * (control_change - np.dot(X_c, beta)) + inf_control_reg_corr
-                )
+                inf_control = inf_control_or + inf_control_reg_corr
                 inf_func = np.concatenate([inf_treated, inf_control])
 
                 # SE from influence function variance
-                var_psi = np.sum(inf_treated**2) + np.sum(inf_control**2)
-                se = float(np.sqrt(var_psi)) if var_psi > 0 else 0.0
+                se = float(np.sqrt(np.sum(inf_func**2)))
+                se = se if se > 0 else 0.0
             else:
                 att = float(np.mean(treated_residuals))
 
diff --git a/diff_diff/triple_diff.py b/diff_diff/triple_diff.py
@@ -1077,11 +1077,18 @@ def _estimate_ddd_decomposition(
 
         if resolved_survey is not None:
             # Survey-weighted SE via TSL on the combined influence function.
-            # Treat the IF as a single-parameter score vector:
-            #   compute_survey_vcov(ones, IF, resolved) gives V(ATT).
+            # The pairwise IFs already incorporate survey weights (via weighted
+            # Riesz representers), but compute_survey_vcov multiplies by weights
+            # again internally. Divide out the survey weights to get the
+            # unweighted IF that TSL will correctly re-weight.
             from diff_diff.survey import compute_survey_vcov
 
-            vcov_survey = compute_survey_vcov(np.ones((n, 1)), inf_func, resolved_survey)
+            inf_for_tsl = inf_func.copy()
+            sw = survey_weights
+            if sw is not None:
+                nz = sw > 0
+                inf_for_tsl[nz] = inf_for_tsl[nz] / sw[nz]
+            vcov_survey = compute_survey_vcov(np.ones((n, 1)), inf_for_tsl, resolved_survey)
             se = float(np.sqrt(vcov_survey[0, 0]))
         elif self._cluster_ids is not None:
             # Cluster-robust SE: sum IF within clusters, then Liang-Zeger variance