Address PR #364 AI review R5: placebo_event_study NaN-on-invalid parity

igerber · claude · igerber · commit efb5252ca2b1 · 2026-04-24T18:53:38.000-04:00
P1: the NaN-on-invalid-bootstrap pattern was applied to overall /
joiners / leavers / event_study_effects / path_effects, but the
parallel dynamic-placebo propagation block at
chaisemartin_dhaultfoeuille.py:3050 kept the pre-fix pattern
(`if np.isfinite(bs_se): overwrite else leave analytical intact`).

Dynamic placebo rows surface on `results.placebo_event_study` and in
`results.to_dataframe(level="event_study")` negative-horizon rows; a
non-finite placebo bootstrap SE would silently leave analytical
`se / t_stat / p_value / conf_int` in place, mixing bootstrap- and
analytical-contract semantics in the same rendered output.

Fix: add the `else -> NaN tuple` branch to the placebo_event_study
propagation block, mirroring the five other surfaces above.

Regression test
`test_nan_contract_extends_to_placebo_event_study_horizons` fits
`n_bootstrap=1` on a T=5 panel with placebos enabled and asserts that
every `placebo_event_study[-lag]` entry and every negative-horizon
row in `to_dataframe(level="event_study")` has NaN `se / t_stat /
p_value / conf_int_{lower,upper}`.

Full dCDH regression: 215 pass. TestByPathBootstrap: 15 pass under
-m slow.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/diff_diff/chaisemartin_dhaultfoeuille.py b/diff_diff/chaisemartin_dhaultfoeuille.py
@@ -3034,8 +3034,20 @@ def fit(
                         if bootstrap_results.placebo_horizon_p_values
                         else None
                     )
+                    # Same bootstrap-contract rule as overall / joiners /
+                    # leavers / event_study_effects / path_effects above:
+                    # once the caller opts into n_bootstrap > 0, the
+                    # bootstrap output replaces analytical inference on
+                    # this surface regardless of outcome. Non-finite
+                    # bootstrap SE writes NaN to the full inference tuple
+                    # rather than silently leaving analytical values in
+                    # place — that would mix bootstrap-contract and
+                    # analytical-contract semantics in the same rendered
+                    # output (dynamic placebo rows appear in
+                    # `results.to_dataframe(level="event_study")` alongside
+                    # positive-horizon entries).
+                    eff = placebo_event_study_dict[neg_key]["effect"]
                     if bs_se is not None and np.isfinite(bs_se):
-                        eff = placebo_event_study_dict[neg_key]["effect"]
                         placebo_event_study_dict[neg_key]["se"] = bs_se
                         placebo_event_study_dict[neg_key]["p_value"] = (
                             bs_p if bs_p is not None else np.nan
@@ -3049,6 +3061,13 @@ def fit(
                             alpha=self.alpha,
                             df=_inference_df(_df_survey, resolved_survey),
                         )[0]
+                    else:
+                        placebo_event_study_dict[neg_key]["se"] = np.nan
+                        placebo_event_study_dict[neg_key]["p_value"] = np.nan
+                        placebo_event_study_dict[neg_key]["conf_int"] = (
+                            np.nan, np.nan,
+                        )
+                        placebo_event_study_dict[neg_key]["t_stat"] = np.nan
 
         # Phase 2: build normalized_effects with SE
         normalized_effects_out: Optional[Dict[int, Dict[str, Any]]] = None
diff --git a/tests/test_chaisemartin_dhaultfoeuille.py b/tests/test_chaisemartin_dhaultfoeuille.py
@@ -4593,6 +4593,86 @@ def test_overflow_warning_fires_exactly_once_under_bootstrap(self):
             f"Messages: {[str(w.message) for w in overflow_warnings]}"
         )
 
+    def test_nan_contract_extends_to_placebo_event_study_horizons(self):
+        """
+        Dynamic placebo horizons go through their own bootstrap
+        propagation block at
+        ``chaisemartin_dhaultfoeuille.py::placebo_event_study_dict``
+        and surface in ``results.placebo_event_study`` and
+        ``results.to_dataframe(level="event_study")`` (negative-horizon
+        rows). Pin the same NaN-on-invalid contract as the positive
+        horizons: ``n_bootstrap=1`` on a panel with valid placebo
+        eligibility must yield NaN SE / t / p / CI on every placebo
+        entry, not the analytical values populated in the build step
+        before bootstrap propagation.
+        """
+        # Longer panel (T=5) so placebo horizons have enough cells.
+        rng = np.random.default_rng(42)
+        rows = []
+        for g in (1, 2, 3, 4, 5, 6):
+            for t in range(5):
+                d = 1 if t >= 2 else 0
+                y = d * 2.0 + rng.normal(0, 0.1)
+                rows.append({"group": g, "period": t, "treatment": d, "outcome": y})
+        for g in (7, 8):
+            for t in range(5):
+                y = rng.normal(0, 0.1)
+                rows.append({"group": g, "period": t, "treatment": 0, "outcome": y})
+        data = pd.DataFrame(rows)
+
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore")
+            est = ChaisemartinDHaultfoeuille(
+                n_bootstrap=1,  # forces non-finite bootstrap SE
+                seed=42,
+                twfe_diagnostic=False,
+                placebo=True,  # enable placebo surface
+            )
+            res = est.fit(
+                data,
+                outcome="outcome",
+                group="group",
+                time="period",
+                treatment="treatment",
+                L_max=2,
+            )
+
+        # If the panel + L_max produced placebo horizons, each must be
+        # NaN-consistent. If no placebos were produced, skip — the test
+        # relies on having at least one placebo row to exercise the
+        # propagation path.
+        if res.placebo_event_study is None or not res.placebo_event_study:
+            pytest.skip(
+                "placebo_event_study empty on this panel; cannot exercise "
+                "the placebo bootstrap propagation path"
+            )
+        for lag_key, entry in res.placebo_event_study.items():
+            assert np.isnan(entry["se"]), (
+                f"placebo_event_study[{lag_key}].se must be NaN under "
+                f"n_bootstrap=1; got {entry['se']}"
+            )
+            assert np.isnan(entry["t_stat"])
+            assert np.isnan(entry["p_value"])
+            lo, hi = entry["conf_int"]
+            assert np.isnan(lo) and np.isnan(hi)
+            # Effect may be NaN legitimately when N_pl_l == 0 for this
+            # lag (panel/horizon eligibility, not a bootstrap artifact).
+            # We only assert the inference-field NaN contract here.
+
+        # `to_dataframe(level="event_study")` surfaces these rows too.
+        # Negative-horizon rows must also show NaN in the inference
+        # columns.
+        df_es = res.to_dataframe(level="event_study")
+        negative_rows = df_es[df_es["horizon"] < 0]
+        if len(negative_rows) > 0:
+            for col in ("se", "t_stat", "p_value",
+                        "conf_int_lower", "conf_int_upper"):
+                assert negative_rows[col].isna().all(), (
+                    f"to_dataframe(level='event_study') negative-horizon "
+                    f"column {col!r} must be NaN under n_bootstrap=1; "
+                    f"got {negative_rows[col].tolist()}"
+                )
+
     def test_summary_footer_mixed_validity_surfaces_live_targets(self):
         """
         Mixed-validity case: overall_se / event_study_ses degenerate to