Filter NaN cells in bootstrap aggregation paths, add bootstrap NaN test, extend validator group fields

igerber · claude · igerber · commit 909cf05b2a18 · 2026-03-14T19:21:12.000-04:00
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
diff --git a/benchmarks/speed_review/baseline_results.json b/benchmarks/speed_review/baseline_results.json
@@ -414,15 +414,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9301904330043325,
-        "se": 0.030438318925920818
+        "se": 0.030438318925920818,
+        "t_stat": 63.41317461394397,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8702219368960384,
+          1.9861420614466454
+        ]
       },
       "5": {
         "effect": 1.9809149332576672,
-        "se": 0.03170174036975451
+        "se": 0.03170174036975451,
+        "t_stat": 62.48599951148382,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9184994180296897,
+          2.0357338459955687
+        ]
       },
       "7": {
         "effect": 1.9717890565347787,
-        "se": 0.03344476401759643
+        "se": 0.03344476401759643,
+        "t_stat": 58.956584519399,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9113592178120258,
+          2.0361181246440454
+        ]
       }
     }
   },
@@ -841,15 +859,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9295320405205874,
-        "se": 0.03044125859655524
+        "se": 0.03044125859655524,
+        "t_stat": 63.38542259678234,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8695941117699424,
+          1.9867835997412717
+        ]
       },
       "5": {
         "effect": 1.980830114174799,
-        "se": 0.0316586783231788
+        "se": 0.0316586783231788,
+        "t_stat": 62.568313621751564,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9193890597593606,
+          2.0362551053682205
+        ]
       },
       "7": {
         "effect": 1.9724360751947247,
-        "se": 0.03346783119193577
+        "se": 0.03346783119193577,
+        "t_stat": 58.93528217836812,
+        "p_value": 0.005,
+        "conf_int": [
+          1.912440579136104,
+          2.036883663702173
+        ]
       }
     }
   },
@@ -1268,15 +1304,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9294692278922927,
-        "se": 0.030613393479888402
+        "se": 0.030613393479888402,
+        "t_stat": 63.02696331786496,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8693199149275344,
+          1.983526736406974
+        ]
       },
       "5": {
         "effect": 1.9808312690492889,
-        "se": 0.03170591980009046
+        "se": 0.03170591980009046,
+        "t_stat": 62.47512393706482,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9183357288880067,
+          2.036631351864895
+        ]
       },
       "7": {
         "effect": 1.9738890151454458,
-        "se": 0.03333757547853297
+        "se": 0.03333757547853297,
+        "t_stat": 59.20913524189814,
+        "p_value": 0.005,
+        "conf_int": [
+          1.912612275253619,
+          2.036232874071883
+        ]
       }
     }
   },
@@ -1695,15 +1749,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9295291363580418,
-        "se": 0.030432814553369162
+        "se": 0.030432814553369162,
+        "t_stat": 63.40291440919082,
+        "p_value": 0.005,
+        "conf_int": [
+          1.869928417389561,
+          1.9864120974980581
+        ]
       },
       "5": {
         "effect": 1.9808298091482444,
-        "se": 0.03166813271404776
+        "se": 0.03166813271404776,
+        "t_stat": 62.54962447689763,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9193431683117772,
+          2.0362183499128976
+        ]
       },
       "7": {
         "effect": 1.9724482314870557,
-        "se": 0.03348899468270557
+        "se": 0.03348899468270557,
+        "t_stat": 58.89840080824135,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9113054655520512,
+          2.0358791270186636
+        ]
       }
     }
   },
@@ -2122,15 +2194,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9295131516250037,
-        "se": 0.030428651624796504
+        "se": 0.030428651624796504,
+        "t_stat": 63.41106321164199,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8693318914387955,
+          1.9852891590817527
+        ]
       },
       "5": {
         "effect": 1.980829710949667,
-        "se": 0.031711555960950315
+        "se": 0.031711555960950315,
+        "t_stat": 62.463970969726795,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9183682933830388,
+          2.035608652828243
+        ]
       },
       "7": {
         "effect": 1.972400906646088,
-        "se": 0.033466935554797926
+        "se": 0.033466935554797926,
+        "t_stat": 58.93580855099589,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9108155783646885,
+          2.035952061830552
+        ]
       }
     }
   },
@@ -2549,15 +2639,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9379600572395599,
-        "se": 0.027359714676020434
+        "se": 0.027359714676020434,
+        "t_stat": 70.8326121155823,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8889964928323424,
+          1.9847938462368524
+        ]
       },
       "5": {
         "effect": 1.9776177086894955,
-        "se": 0.029511266225510993
+        "se": 0.029511266225510993,
+        "t_stat": 67.01229603560505,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9223093399752835,
+          2.0294569469461097
+        ]
       },
       "7": {
         "effect": 1.972400906646088,
-        "se": 0.033466935554797926
+        "se": 0.033466935554797926,
+        "t_stat": 58.93580855099589,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9108155783646885,
+          2.035952061830552
+        ]
       }
     }
   },
@@ -2976,15 +3084,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9379732080320693,
-        "se": 0.027348748599256394
+        "se": 0.027348748599256394,
+        "t_stat": 70.86149485043576,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8890625503369387,
+          1.9846384878549268
+        ]
       },
       "5": {
         "effect": 1.9776180319767032,
-        "se": 0.02946287209657048
+        "se": 0.02946287209657048,
+        "t_stat": 67.12237780127691,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9220032490097771,
+          2.0295504746249913
+        ]
       },
       "7": {
         "effect": 1.9724482314870557,
-        "se": 0.03348899468270557
+        "se": 0.03348899468270557,
+        "t_stat": 58.89840080824135,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9113054655520512,
+          2.0358791270186636
+        ]
       }
     }
   },
@@ -3403,15 +3529,33 @@
     "group_effects": {
       "3": {
         "effect": 1.9379731464282752,
-        "se": 0.027354393932262182
+        "se": 0.027354393932262182,
+        "t_stat": 70.84686837614781,
+        "p_value": 0.005,
+        "conf_int": [
+          1.8891430541850542,
+          1.9844547989387653
+        ]
       },
       "5": {
         "effect": 1.977618261825107,
-        "se": 0.029456139694155045
+        "se": 0.029456139694155045,
+        "t_stat": 67.13772688338805,
+        "p_value": 0.005,
+        "conf_int": [
+          1.9219215453418508,
+          2.02949447907519
+        ]
       },
       "7": {
         "effect": 1.9724360751947247,
-        "se": 0.03346783119193577
+        "se": 0.03346783119193577,
+        "t_stat": 58.93528217836812,
+        "p_value": 0.005,
+        "conf_int": [
+          1.912440579136104,
+          2.036883663702173
+        ]
       }
     }
   }
diff --git a/benchmarks/speed_review/validate_results.py b/benchmarks/speed_review/validate_results.py
@@ -107,6 +107,9 @@ def run_estimator(df, estimation_method="reg", covariates=None, control_group="n
             ge[str(g_key)] = {
                 "effect": float(data["effect"]),
                 "se": float(data["se"]),
+                "t_stat": float(data["t_stat"]),
+                "p_value": float(data["p_value"]),
+                "conf_int": [float(data["conf_int"][0]), float(data["conf_int"][1])],
             }
         out["group_effects"] = ge
 
@@ -235,6 +238,13 @@ def compare(label, base_val, cur_val, t):
                     continue
                 compare(f"{name}/ge[{g_key}].effect", b_ge["effect"], c_ge["effect"], scenario_tol)
                 compare(f"{name}/ge[{g_key}].se", b_ge["se"], c_ge["se"], gt_se_tol)
+                if "t_stat" in b_ge and "t_stat" in c_ge:
+                    compare(f"{name}/ge[{g_key}].t_stat", b_ge["t_stat"], c_ge["t_stat"], gt_se_tol)
+                if "p_value" in b_ge and "p_value" in c_ge:
+                    compare(f"{name}/ge[{g_key}].p_value", b_ge["p_value"], c_ge["p_value"], 0.02)
+                if "conf_int" in b_ge and "conf_int" in c_ge:
+                    for i, label in enumerate(["lower", "upper"]):
+                        compare(f"{name}/ge[{g_key}].ci.{label}", b_ge["conf_int"][i], c_ge["conf_int"][i], gt_se_tol)
 
         if failures:
             all_failures.extend(failures)
diff --git a/diff_diff/staggered_bootstrap.py b/diff_diff/staggered_bootstrap.py
@@ -204,6 +204,15 @@ def _run_multiplier_bootstrap(
         ], dtype=float)
         post_n_treated = all_n_treated[post_treatment_mask]
 
+        # Filter out NaN ATT(g,t) cells from overall aggregation (matches analytical path)
+        post_effects_raw = np.array([
+            group_time_effects[gt_pairs[i]]['effect'] for i in post_treatment_indices
+        ])
+        finite_post = np.isfinite(post_effects_raw)
+        if not np.all(finite_post):
+            post_treatment_indices = post_treatment_indices[finite_post]
+            post_n_treated = post_n_treated[finite_post]
+
         # Flag to skip overall ATT aggregation when no post-treatment effects
         # But continue bootstrap for per-effect SEs (pre-treatment effects need bootstrap SEs too)
         skip_overall_aggregation = False
@@ -297,7 +306,7 @@ def _run_multiplier_bootstrap(
             # Use combined IF (standard IF + WIF) for proper bootstrap
             post_gt_pairs = [gt_pairs[i] for i in post_treatment_indices]
             post_groups = np.array([gt_pairs[i][0] for i in post_treatment_indices])
-            post_effects = original_atts[post_treatment_mask]
+            post_effects = original_atts[post_treatment_indices]
             overall_combined_if, _ = self._compute_combined_influence_function(
                 post_gt_pairs, overall_weights_post, post_effects, post_groups,
                 influence_func_info, df, unit, precomputed,
@@ -503,6 +512,15 @@ def _prepare_event_study_aggregation(
             effects = np.array([x[1] for x in effect_list])
             n_treated = np.array([x[2] for x in effect_list], dtype=float)
 
+            # Exclude NaN effects (matches analytical aggregation path)
+            finite_mask = np.isfinite(effects)
+            if not np.all(finite_mask):
+                indices = indices[finite_mask]
+                effects = effects[finite_mask]
+                n_treated = n_treated[finite_mask]
+                if len(effects) == 0:
+                    continue
+
             weights = n_treated / np.sum(n_treated)
             agg_effect = np.sum(weights * effects)
 
@@ -553,6 +571,14 @@ def _prepare_group_aggregation(
             indices = np.array([x[0] for x in group_data])
             effects = np.array([x[1] for x in group_data])
 
+            # Exclude NaN effects (matches analytical aggregation path)
+            finite_mask = np.isfinite(effects)
+            if not np.all(finite_mask):
+                indices = indices[finite_mask]
+                effects = effects[finite_mask]
+                if len(effects) == 0:
+                    continue
+
             # Equal weights across time periods
             weights = np.ones(len(effects)) / len(effects)
             agg_effect = np.sum(weights * effects)
diff --git a/tests/test_staggered.py b/tests/test_staggered.py