Address PR #393 R4 P1+P3: bootstrap+placebo regressions + Results docstring

igerber · claude · igerber · commit ad8f6be14d91 · 2026-04-26T16:33:18.000-04:00
P1 fixes — coverage gaps for newly reachable bootstrap+placebo paths:

- test_per_path_placebos_with_trends_linear_bootstrap_inference:
  asserts negative-horizon SE differs between analytical and
  bootstrap fits, proving the placebo bootstrap propagation block
  runs through the first-differenced path.
- test_per_path_placebos_with_trends_linear_bootstrap_nan_consistent:
  n_bootstrap=1 case asserting NaN-consistent inference on negative
  horizons (locks the library-wide NaN-on-invalid contract on this
  newly reachable surface).
- test_per_path_placebos_with_trends_nonparam_bootstrap_inference:
  comparison fit with vs without trends_nonparam under bootstrap +
  placebo; asserts negative-horizon SE differs, proving set_ids
  reaches _collect_path_placebo_bootstrap_inputs.

P3 fix — Results dataclass attribute documentation:
- Added a path_cumulated_event_study attribute entry to the
  ChaisemartinDHaultfoeuilleResults attributes docstring (the field
  already existed but was missing from the public attribute table).

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/diff_diff/chaisemartin_dhaultfoeuille_results.py b/diff_diff/chaisemartin_dhaultfoeuille_results.py
@@ -418,6 +418,26 @@ class ChaisemartinDHaultfoeuilleResults:
         cohort-sharing SE deviation from R documented for
         ``path_effects``. See REGISTRY.md
         ``Note (Phase 3 by_path ...)`` → "Per-path placebos".
+    path_cumulated_event_study : dict, optional
+        Per-path cumulated level effects ``delta_{path, l} =
+        sum_{l'=1..l} DID^{fd}_{path, l'}`` for ``l = 1..L_max``,
+        keyed by observed treatment trajectory (tuple of int). Inner
+        dict is keyed by horizon directly (no ``"horizons"`` wrapper);
+        each entry holds ``{"effect", "se", "t_stat", "p_value",
+        "conf_int", "n_obs"}``. Populated when ``by_path`` is a
+        positive int AND ``trends_linear=True`` AND ``L_max >= 1``;
+        ``None`` otherwise. Mirrors the global ``linear_trends_effects``
+        cumulation: SE on the cumulated layer is the conservative
+        upper bound (sum of per-horizon component SEs from
+        ``path_effects[path]["horizons"][l]["se"]``, NaN-consistent).
+        Built AFTER bootstrap propagation so the cumulated SE / t / p
+        / CI are derived from the FINAL post-bootstrap per-horizon
+        SEs when ``n_bootstrap > 0``. Surfaced as ``cumulated_effect``
+        / ``cumulated_se`` columns on
+        ``to_dataframe(level="by_path")`` (always present; NaN when
+        ``None``) and as a per-path "Cumulated Level Effects" sub-section
+        in ``summary()``. See REGISTRY.md ``Note (Phase 3 by_path
+        ...)`` → "Per-path linear-trends DID^{fd}".
     path_sup_t_bands : dict, optional
         Per-path joint sup-t simultaneous-band metadata, keyed by
         observed treatment trajectory (tuple of int). Each entry holds
diff --git a/tests/test_chaisemartin_dhaultfoeuille.py b/tests/test_chaisemartin_dhaultfoeuille.py
@@ -7299,6 +7299,115 @@ def test_per_path_placebos_with_trends_linear_present(self):
             "placebo path may have regressed."
         )
 
+    @pytest.mark.slow
+    def test_per_path_placebos_with_trends_linear_bootstrap_inference(self):
+        """Bootstrap-derived inference fields populated on negative-
+        horizon ``path_placebo_event_study`` rows under ``by_path +
+        trends_linear + placebo + n_bootstrap > 0``. Pins the placebo
+        bootstrap collector path that consumes the first-differenced
+        ``Y_mat`` AND the bootstrap propagation block starting at
+        ``chaisemartin_dhaultfoeuille.py:3097`` for negative horizons.
+        Without this, a silent regression in the placebo bootstrap
+        propagation would surface analytical SEs on a bootstrap fit.
+        """
+        data = _by_path_data_with_trends_linear()
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore", UserWarning)
+            est_a = ChaisemartinDHaultfoeuille(
+                drop_larger_lower=False, by_path=3, placebo=True
+            )
+            res_a = est_a.fit(
+                data,
+                outcome="outcome",
+                group="group",
+                time="period",
+                treatment="treatment",
+                trends_linear=True,
+                L_max=3,
+            )
+            est_b = ChaisemartinDHaultfoeuille(
+                drop_larger_lower=False,
+                by_path=3,
+                placebo=True,
+                n_bootstrap=200,
+                seed=42,
+            )
+            res_b = est_b.fit(
+                data,
+                outcome="outcome",
+                group="group",
+                time="period",
+                treatment="treatment",
+                trends_linear=True,
+                L_max=3,
+            )
+        # Negative-horizon placebo rows must exist and carry bootstrap-
+        # derived inference. Verify by comparing analytical-only fit's
+        # SEs to bootstrap-fit's SEs on the same negative-horizon
+        # entries: bootstrap should differ (non-bit-identical) since
+        # the propagation block overwrites SE / p_value / conf_int.
+        assert res_b.path_placebo_event_study is not None
+        any_se_diff = False
+        any_finite = False
+        for path, lag_dict in res_b.path_placebo_event_study.items():
+            for lag_k, vals_b in lag_dict.items():
+                if not np.isfinite(vals_b["se"]):
+                    continue
+                any_finite = True
+                vals_a = res_a.path_placebo_event_study.get(path, {}).get(lag_k)
+                if vals_a is None or not np.isfinite(vals_a["se"]):
+                    continue
+                if abs(vals_b["se"] - vals_a["se"]) > 1e-10:
+                    any_se_diff = True
+                    break
+            if any_se_diff:
+                break
+        assert any_finite, "No finite negative-horizon bootstrap SEs surfaced"
+        assert any_se_diff, (
+            "Bootstrap fit produced bit-identical SEs to analytical fit on "
+            "every negative-horizon placebo cell; the placebo bootstrap "
+            "propagation block under trends_linear may not be running."
+        )
+
+    @pytest.mark.slow
+    def test_per_path_placebos_with_trends_linear_bootstrap_nan_consistent(self):
+        """``n_bootstrap=1`` produces NaN-consistent inference on
+        negative-horizon ``path_placebo_event_study`` rows under
+        ``by_path + trends_linear + placebo``. Pins the library-wide
+        NaN-on-invalid bootstrap contract on the new placebo path.
+        """
+        data = _by_path_data_with_trends_linear()
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore", (UserWarning, RuntimeWarning))
+            est = ChaisemartinDHaultfoeuille(
+                drop_larger_lower=False,
+                by_path=3,
+                placebo=True,
+                n_bootstrap=1,
+                seed=42,
+            )
+            res = est.fit(
+                data,
+                outcome="outcome",
+                group="group",
+                time="period",
+                treatment="treatment",
+                trends_linear=True,
+                L_max=3,
+            )
+        assert res.path_placebo_event_study is not None
+        # n_bootstrap=1 → degenerate bootstrap distribution → NaN SE /
+        # p_value on every negative-horizon entry (conf_int not asserted).
+        for path, lag_dict in res.path_placebo_event_study.items():
+            for lag_k, vals in lag_dict.items():
+                assert not np.isfinite(vals["se"]), (
+                    f"path={path} lag={lag_k}: SE finite ({vals['se']}) "
+                    "under n_bootstrap=1; expected NaN"
+                )
+                assert not np.isfinite(vals["p_value"]), (
+                    f"path={path} lag={lag_k}: p_value finite under n_bootstrap=1"
+                )
+
     @pytest.mark.slow
     def test_sup_t_bands_with_trends_linear_finite_crit(self):
         """Per-path joint sup-t bands populated under ``by_path +
@@ -7851,3 +7960,84 @@ def test_sup_t_bands_with_trends_nonparam_finite_crit(self):
             "No positive-horizon cband rows populated under "
             "trends_nonparam + bootstrap"
         )
+
+    @pytest.mark.slow
+    def test_per_path_placebos_with_trends_nonparam_bootstrap_inference(self):
+        """Bootstrap-derived inference fields populated on negative-
+        horizon ``path_placebo_event_study`` rows under ``by_path +
+        trends_nonparam + placebo + n_bootstrap > 0``.
+
+        Pins the ``set_ids`` threading into
+        ``_collect_path_placebo_bootstrap_inputs`` (line 5963 in the
+        diff): without that threading, the placebo bootstrap collector
+        would re-compute the per-group placebo IF with set_ids=None,
+        bypassing the set-restricted control pool. We verify by
+        comparing two bootstrap fits — one with trends_nonparam, one
+        without — and asserting at least one negative-horizon SE
+        differs (the set restriction must propagate through the
+        placebo bootstrap path) AND remains finite.
+        """
+        data = _by_path_data_with_trends_nonparam()
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore", UserWarning)
+            est_no_set = ChaisemartinDHaultfoeuille(
+                drop_larger_lower=False,
+                by_path=3,
+                placebo=True,
+                n_bootstrap=200,
+                seed=42,
+            )
+            res_no = est_no_set.fit(
+                data,
+                outcome="outcome",
+                group="group",
+                time="period",
+                treatment="treatment",
+                L_max=3,
+            )
+            est_set = ChaisemartinDHaultfoeuille(
+                drop_larger_lower=False,
+                by_path=3,
+                placebo=True,
+                n_bootstrap=200,
+                seed=42,
+            )
+            res_set = est_set.fit(
+                data,
+                outcome="outcome",
+                group="group",
+                time="period",
+                treatment="treatment",
+                trends_nonparam="state",
+                L_max=3,
+            )
+        assert res_set.path_placebo_event_study is not None
+        assert res_no.path_placebo_event_study is not None
+        any_diff = False
+        any_finite = False
+        for path, lag_dict in res_set.path_placebo_event_study.items():
+            for lag_k, vals_set in lag_dict.items():
+                if not np.isfinite(vals_set["se"]):
+                    continue
+                any_finite = True
+                vals_no = res_no.path_placebo_event_study.get(path, {}).get(
+                    lag_k
+                )
+                if vals_no is None or not np.isfinite(vals_no["se"]):
+                    continue
+                # Set restriction shrinks the control pool; with the
+                # same seed, the bootstrap distribution should differ.
+                if abs(vals_set["se"] - vals_no["se"]) > 1e-10:
+                    any_diff = True
+                    break
+            if any_diff:
+                break
+        assert any_finite, (
+            "No finite negative-horizon bootstrap SEs surfaced under "
+            "trends_nonparam + placebo + bootstrap"
+        )
+        assert any_diff, (
+            "Bootstrap placebo SEs are bit-identical with vs without "
+            "trends_nonparam restriction; set_ids may not be reaching "
+            "the per-path placebo bootstrap collector."
+        )