From 13546f39eaf2d28a8f84d3b6e2ebb04731cb4cd4 Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 15:46:15 -0500 Subject: [PATCH 1/9] SDID methodology review: rewrite to match R synthdid + Rust parallel variance MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Comprehensive review and rewrite of the Synthetic DiD implementation to match R's synthdid package behavior (Arkhangelsky et al. 2021): Methodology (Python): - Frank-Wolfe solver matching R's sc.weight.fw() for unit and time weights - Two-pass sparsification: 100 iters → sparsify → 10000 iters (matching R) - Auto-computed regularization from data noise level (zeta_omega, zeta_lambda) - Bootstrap SE uses fixed weights (matching R's bootstrap_sample) - Placebo SE re-estimates weights per permutation (matching R's Algorithm 4) - ATT estimator matches R's synthdid_estimate formula Rust acceleration: - New rust/src/sdid_variance.rs: parallel placebo and bootstrap SE via rayon - placebo_variance_sdid(): ~8x speedup (200 permutations in parallel) - bootstrap_variance_sdid(): ~6x speedup (200 bootstrap iterations in parallel) - Frank-Wolfe solver in Rust (weights.rs) for unit and time weight computation - Fix stale PyO3 defaults on sc_weight_fw and compute_sdid_unit_weights - Make internal weight functions pub(crate) for cross-module access Testing: - 41 new methodology tests (test_methodology_sdid.py) - 9 new Rust variance backend tests (test_rust_backend.py) - Updated estimator and utility tests for new API - All 31 SDID estimator tests pass in both Rust and pure Python modes Documentation: - Updated METHODOLOGY_REVIEW.md, REGISTRY.md, README.md, CLAUDE.md - Updated tutorial notebook and benchmark scripts Co-Authored-By: Claude Opus 4.6 --- CLAUDE.md | 8 + METHODOLOGY_REVIEW.md | 33 +- README.md | 22 +- benchmarks/R/benchmark_synthdid.R | 24 +- benchmarks/python/benchmark_synthdid.py | 6 +- diff_diff/_backend.py | 32 ++ diff_diff/results.py | 18 +- 
diff_diff/synthetic_did.py | 399 +++++++++++----- diff_diff/utils.py | 405 ++++++++++++++--- docs/methodology/REGISTRY.md | 107 ++++- docs/tutorials/03_synthetic_did.ipynb | 75 +-- rust/src/lib.rs | 13 +- rust/src/sdid_variance.rs | 496 +++++++++++++++++++ rust/src/weights.rs | 499 ++++++++++++++++++- tests/test_estimators.py | 50 +- tests/test_methodology_sdid.py | 605 ++++++++++++++++++++++++ tests/test_rust_backend.py | 478 +++++++++++++++++++ tests/test_utils.py | 52 +- 18 files changed, 3020 insertions(+), 302 deletions(-) create mode 100644 rust/src/sdid_variance.rs create mode 100644 tests/test_methodology_sdid.py diff --git a/CLAUDE.md b/CLAUDE.md index 783bcf47..e1d76280 100644 --- a/CLAUDE.md +++ b/CLAUDE.md @@ -68,6 +68,10 @@ cross-platform compilation - no OpenBLAS or Intel MKL installation required. - **`diff_diff/synthetic_did.py`** - Synthetic DiD estimator: - `SyntheticDiD` - Synthetic control combined with DiD (Arkhangelsky et al. 2021) + - Frank-Wolfe solver matching R's `synthdid::sc.weight.fw()` for unit and time weights + - Auto-computed regularization from data noise level (`zeta_omega`, `zeta_lambda`) + - Two-pass sparsification for unit weights (100 iters → sparsify → 10000 iters) + - Bootstrap SE uses fixed weights (matches R's `bootstrap_sample`) - **`diff_diff/staggered.py`** - Staggered adoption DiD main module: - `CallawaySantAnna` - Callaway & Sant'Anna (2021) estimator for heterogeneous treatment timing @@ -163,6 +167,9 @@ cross-platform compilation - no OpenBLAS or Intel MKL installation required. 
- `compute_unit_distance_matrix()` - Parallel pairwise RMSE distance computation (4-8x speedup) - `loocv_grid_search()` - Parallel LOOCV across tuning parameters (10-50x speedup) - `bootstrap_trop_variance()` - Parallel bootstrap variance estimation (5-15x speedup) + - **`rust/src/sdid_variance.rs`** - SDID variance estimation acceleration: + - `placebo_variance_sdid()` - Parallel placebo SE computation (~8x speedup) + - `bootstrap_variance_sdid()` - Parallel bootstrap SE computation (~6x speedup) - Uses pure-Rust `faer` library for linear algebra (no external BLAS/LAPACK dependencies) - Cross-platform: builds on Linux, macOS, and Windows without additional setup - Provides 4-8x speedup for SyntheticDiD, 5-20x speedup for TROP @@ -373,6 +380,7 @@ See `docs/benchmarks.rst` for full methodology and validation results. Tests mirror the source modules: - `tests/test_estimators.py` - Tests for DifferenceInDifferences, TWFE, MultiPeriodDiD, SyntheticDiD +- `tests/test_methodology_sdid.py` - Methodology tests for SDID: Frank-Wolfe solver, regularization, sparsification, edge cases - `tests/test_staggered.py` - Tests for CallawaySantAnna - `tests/test_sun_abraham.py` - Tests for SunAbraham interaction-weighted estimator - `tests/test_imputation.py` - Tests for ImputationDiD (Borusyak et al. 
2024) estimator diff --git a/METHODOLOGY_REVIEW.md b/METHODOLOGY_REVIEW.md index 884e735d..24903bd3 100644 --- a/METHODOLOGY_REVIEW.md +++ b/METHODOLOGY_REVIEW.md @@ -25,7 +25,7 @@ Each estimator in diff-diff should be periodically reviewed to ensure: | TwoWayFixedEffects | `twfe.py` | `fixest::feols()` | **Complete** | 2026-02-08 | | CallawaySantAnna | `staggered.py` | `did::att_gt()` | **Complete** | 2026-01-24 | | SunAbraham | `sun_abraham.py` | `fixest::sunab()` | Not Started | - | -| SyntheticDiD | `synthetic_did.py` | `synthdid::synthdid_estimate()` | Not Started | - | +| SyntheticDiD | `synthetic_did.py` | `synthdid::synthdid_estimate()` | **Complete** | 2026-02-10 | | TripleDifference | `triple_diff.py` | (forthcoming) | Not Started | - | | TROP | `trop.py` | (forthcoming) | Not Started | - | | BaconDecomposition | `bacon.py` | `bacondecomp::bacon()` | Not Started | - | @@ -314,14 +314,37 @@ variables appear to the left of the `|` separator. | Module | `synthetic_did.py` | | Primary Reference | Arkhangelsky et al. (2021) | | R Reference | `synthdid::synthdid_estimate()` | -| Status | Not Started | -| Last Review | - | +| Status | **Complete** | +| Last Review | 2026-02-10 | **Corrections Made:** -- (None yet) +1. **Time weights: Frank-Wolfe on collapsed form** (was heuristic inverse-distance). + Replaced ad-hoc inverse-distance weighting with the Frank-Wolfe algorithm operating + on the collapsed (N_co x T_pre) problem as specified in Algorithm 1 of + Arkhangelsky et al. (2021), matching R's `synthdid::fw.step()`. +2. **Unit weights: Frank-Wolfe with two-pass sparsification** (was projected gradient + descent with wrong penalty). Replaced projected gradient descent (which used an + incorrect penalty formulation) with Frank-Wolfe optimization followed by two-pass + sparsification, matching R's `synthdid::sc.weight.fw()` and `sparsify_function()`. +3. **Auto-computed regularization from data noise level** (was `lambda_reg=0.0`, + `zeta=1.0`). 
Regularization parameters `zeta_omega` and `zeta_lambda` are now + computed automatically from the data noise level (N_tr * sigma^2) as specified in + Appendix D of Arkhangelsky et al. (2021), matching R's default behavior. +4. **Bootstrap SE uses fixed weights matching R's `bootstrap_sample`** (was + re-estimating all weights). The bootstrap variance procedure now holds unit and time + weights fixed at their point estimates and only re-estimates the treatment effect, + matching the approach in R's `synthdid::bootstrap_sample()`. +5. **Default `variance_method` changed to `"placebo"`** matching R's default. The R + package uses placebo variance by default (`synthdid_estimate` returns an object whose + `vcov()` uses the placebo method); our default now matches. +6. **Deprecated `lambda_reg` and `zeta` params; new params are `zeta_omega` and + `zeta_lambda`**. The old parameters had unclear semantics and did not correspond to + the paper's notation. The new parameters directly match the paper and R package + naming conventions. `lambda_reg` and `zeta` are deprecated with warnings and will + be removed in a future release. 
**Outstanding Concerns:** -- (None yet) +- (None) --- diff --git a/README.md b/README.md index 55bd9aed..f7385ad4 100644 --- a/README.md +++ b/README.md @@ -1163,11 +1163,12 @@ Use Synthetic DiD instead of standard DiD when: ```python SyntheticDiD( - lambda_reg=0.0, # Regularization toward uniform weights (0 = no reg) - zeta=1.0, # Time weight regularization (higher = more uniform) - alpha=0.05, # Significance level - n_bootstrap=200, # Bootstrap iterations for SE (0 = placebo-based) - seed=None # Random seed for reproducibility + zeta_omega=None, # Unit weight regularization (None = auto-computed from data) + zeta_lambda=None, # Time weight regularization (None = auto-computed from data) + alpha=0.05, # Significance level + variance_method="placebo", # "placebo" (default, matches R) or "bootstrap" + n_bootstrap=200, # Replications for SE estimation + seed=None # Random seed for reproducibility ) ``` @@ -1872,11 +1873,12 @@ MultiPeriodDiD( ```python SyntheticDiD( - lambda_reg=0.0, # L2 regularization for unit weights - zeta=1.0, # Regularization for time weights - alpha=0.05, # Significance level for CIs - n_bootstrap=200, # Bootstrap iterations for SE - seed=None # Random seed for reproducibility + zeta_omega=None, # Unit weight regularization (None = auto from data) + zeta_lambda=None, # Time weight regularization (None = auto from data) + alpha=0.05, # Significance level for CIs + variance_method="placebo", # "placebo" (R default) or "bootstrap" + n_bootstrap=200, # Replications for SE estimation + seed=None # Random seed for reproducibility ) ``` diff --git a/benchmarks/R/benchmark_synthdid.R b/benchmarks/R/benchmark_synthdid.R index b4069e52..1c36f7d4 100644 --- a/benchmarks/R/benchmark_synthdid.R +++ b/benchmarks/R/benchmark_synthdid.R @@ -82,6 +82,15 @@ se_time <- as.numeric(difftime(Sys.time(), se_start, units = "secs")) total_time <- estimation_time + se_time +# Compute noise level and regularization (to match Python's auto-computed values) +N0 <- setup$N0 
+T0 <- setup$T0 +N1 <- nrow(setup$Y) - N0 +T1 <- ncol(setup$Y) - T0 +noise_level <- sd(apply(setup$Y[1:N0, 1:T0], 1, diff)) +zeta_omega <- ((N1 * T1)^(1/4)) * noise_level +zeta_lambda <- 1e-6 * noise_level + # Format output results <- list( estimator = "synthdid::synthdid_estimate", @@ -90,10 +99,15 @@ results <- list( att = as.numeric(tau_hat), se = se, - # Weights + # Weights (full precision) unit_weights = as.numeric(unit_weights), time_weights = as.numeric(time_weights), + # Regularization parameters + noise_level = noise_level, + zeta_omega = zeta_omega, + zeta_lambda = zeta_lambda, + # Timing timing = list( estimation_seconds = estimation_time, @@ -105,10 +119,10 @@ results <- list( metadata = list( r_version = R.version.string, synthdid_version = as.character(packageVersion("synthdid")), - n_control = setup$N0, - n_treated = nrow(setup$Y) - setup$N0, - n_pre_periods = setup$T0, - n_post_periods = ncol(setup$Y) - setup$T0 + n_control = N0, + n_treated = N1, + n_pre_periods = T0, + n_post_periods = T1 ) ) diff --git a/benchmarks/python/benchmark_synthdid.py b/benchmarks/python/benchmark_synthdid.py index 4c1323b8..7986d35d 100644 --- a/benchmarks/python/benchmark_synthdid.py +++ b/benchmarks/python/benchmark_synthdid.py @@ -106,9 +106,13 @@ def main(): # Point estimate and SE "att": float(results.att), "se": float(results.se), - # Weights + # Weights (full precision) "unit_weights": unit_weights_df["weight"].tolist(), "time_weights": time_weights_df["weight"].tolist(), + # Regularization parameters + "noise_level": float(results.noise_level) if results.noise_level is not None else None, + "zeta_omega": float(results.zeta_omega) if results.zeta_omega is not None else None, + "zeta_lambda": float(results.zeta_lambda) if results.zeta_lambda is not None else None, # Timing "timing": { "estimation_seconds": total_time, diff --git a/diff_diff/_backend.py b/diff_diff/_backend.py index 60bf853b..dd8af93c 100644 --- a/diff_diff/_backend.py +++ b/diff_diff/_backend.py 
@@ -30,6 +30,14 @@ # TROP estimator acceleration (joint method) loocv_grid_search_joint as _rust_loocv_grid_search_joint, bootstrap_trop_variance_joint as _rust_bootstrap_trop_variance_joint, + # SDID weights (Frank-Wolfe matching R's synthdid) + compute_sdid_unit_weights as _rust_sdid_unit_weights, + compute_time_weights as _rust_compute_time_weights, + compute_noise_level as _rust_compute_noise_level, + sc_weight_fw as _rust_sc_weight_fw, + # SDID variance estimation (parallel placebo and bootstrap) + placebo_variance_sdid as _rust_placebo_variance_sdid, + bootstrap_variance_sdid as _rust_bootstrap_variance_sdid, ) _rust_available = True except ImportError: @@ -46,6 +54,14 @@ # TROP estimator acceleration (joint method) _rust_loocv_grid_search_joint = None _rust_bootstrap_trop_variance_joint = None + # SDID weights (Frank-Wolfe matching R's synthdid) + _rust_sdid_unit_weights = None + _rust_compute_time_weights = None + _rust_compute_noise_level = None + _rust_sc_weight_fw = None + # SDID variance estimation (parallel placebo and bootstrap) + _rust_placebo_variance_sdid = None + _rust_bootstrap_variance_sdid = None # Determine final backend based on environment variable and availability if _backend_env == 'python': @@ -63,6 +79,14 @@ # TROP estimator acceleration (joint method) _rust_loocv_grid_search_joint = None _rust_bootstrap_trop_variance_joint = None + # SDID weights (Frank-Wolfe matching R's synthdid) + _rust_sdid_unit_weights = None + _rust_compute_time_weights = None + _rust_compute_noise_level = None + _rust_sc_weight_fw = None + # SDID variance estimation (parallel placebo and bootstrap) + _rust_placebo_variance_sdid = None + _rust_bootstrap_variance_sdid = None elif _backend_env == 'rust': # Force Rust mode - fail if not available if not _rust_available: @@ -89,4 +113,12 @@ # TROP estimator acceleration (joint method) '_rust_loocv_grid_search_joint', '_rust_bootstrap_trop_variance_joint', + # SDID weights (Frank-Wolfe matching R's synthdid) + 
'_rust_sdid_unit_weights', + '_rust_compute_time_weights', + '_rust_compute_noise_level', + '_rust_sc_weight_fw', + # SDID variance estimation (parallel placebo and bootstrap) + '_rust_placebo_variance_sdid', + '_rust_bootstrap_variance_sdid', ] diff --git a/diff_diff/results.py b/diff_diff/results.py index decdf5ba..5fefea62 100644 --- a/diff_diff/results.py +++ b/diff_diff/results.py @@ -605,8 +605,10 @@ class SyntheticDiDResults: pre_periods: List[Any] post_periods: List[Any] alpha: float = 0.05 - variance_method: str = field(default="bootstrap") - lambda_reg: Optional[float] = field(default=None) + variance_method: str = field(default="placebo") + noise_level: Optional[float] = field(default=None) + zeta_omega: Optional[float] = field(default=None) + zeta_lambda: Optional[float] = field(default=None) pre_treatment_fit: Optional[float] = field(default=None) placebo_effects: Optional[np.ndarray] = field(default=None) n_bootstrap: Optional[int] = field(default=None) @@ -650,8 +652,12 @@ def summary(self, alpha: Optional[float] = None) -> str: f"{'Post-treatment periods:':<25} {len(self.post_periods):>10}", ] - if self.lambda_reg is not None: - lines.append(f"{'Regularization (lambda):':<25} {self.lambda_reg:>10.4f}") + if self.zeta_omega is not None: + lines.append(f"{'Zeta (unit weights):':<25} {self.zeta_omega:>10.4f}") + if self.zeta_lambda is not None: + lines.append(f"{'Zeta (time weights):':<25} {self.zeta_lambda:>10.6f}") + if self.noise_level is not None: + lines.append(f"{'Noise level:':<25} {self.noise_level:>10.4f}") if self.pre_treatment_fit is not None: lines.append(f"{'Pre-treatment fit (RMSE):':<25} {self.pre_treatment_fit:>10.4f}") @@ -731,7 +737,9 @@ def to_dict(self) -> Dict[str, Any]: "n_pre_periods": len(self.pre_periods), "n_post_periods": len(self.post_periods), "variance_method": self.variance_method, - "lambda_reg": self.lambda_reg, + "noise_level": self.noise_level, + "zeta_omega": self.zeta_omega, + "zeta_lambda": self.zeta_lambda, 
"pre_treatment_fit": self.pre_treatment_fit, } if self.n_bootstrap is not None: diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index dca934bb..f77d4ca4 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -13,10 +13,12 @@ from diff_diff.linalg import solve_ols from diff_diff.results import SyntheticDiDResults from diff_diff.utils import ( + _compute_regularization, + _sum_normalize, compute_confidence_interval, compute_p_value, compute_sdid_estimator, - compute_synthetic_weights, + compute_sdid_unit_weights, compute_time_weights, validate_binary, ) @@ -38,21 +40,20 @@ class SyntheticDiD(DifferenceInDifferences): Parameters ---------- - lambda_reg : float, default=0.0 - L2 regularization for unit weights. Larger values shrink weights - toward uniform. Useful when n_pre_periods < n_control_units. - zeta : float, default=1.0 - Regularization for time weights. Larger values give more uniform - time weights (closer to standard DiD). + zeta_omega : float, optional + Regularization for unit weights. If None (default), auto-computed + from data as ``(N1 * T1)^(1/4) * noise_level`` matching R's synthdid. + zeta_lambda : float, optional + Regularization for time weights. If None (default), auto-computed + from data as ``1e-6 * noise_level`` matching R's synthdid. alpha : float, default=0.05 Significance level for confidence intervals. - variance_method : str, default="bootstrap" + variance_method : str, default="placebo" Method for variance estimation: - - "bootstrap": Block bootstrap at unit level (default) - "placebo": Placebo-based variance matching R's synthdid::vcov(method="placebo"). - Implements Algorithm 4 from Arkhangelsky et al. (2021): randomly permutes - control units, designates N₁ as pseudo-treated, renormalizes original - weights for remaining pseudo-controls, and computes SDID estimate. + Implements Algorithm 4 from Arkhangelsky et al. (2021). This is R's default. 
+ - "bootstrap": Bootstrap at unit level with fixed weights matching R's + synthdid::vcov(method="bootstrap"). n_bootstrap : int, default=200 Number of replications for variance estimation. Used for both: - Bootstrap: Number of bootstrap samples @@ -130,16 +131,36 @@ class SyntheticDiD(DifferenceInDifferences): def __init__( self, - lambda_reg: float = 0.0, - zeta: float = 1.0, + zeta_omega: Optional[float] = None, + zeta_lambda: Optional[float] = None, alpha: float = 0.05, - variance_method: str = "bootstrap", + variance_method: str = "placebo", n_bootstrap: int = 200, - seed: Optional[int] = None + seed: Optional[int] = None, + # Deprecated — accepted for backward compat, ignored with warning + lambda_reg: Optional[float] = None, + zeta: Optional[float] = None, + **kwargs, ): + if lambda_reg is not None: + warnings.warn( + "lambda_reg is deprecated and ignored. Regularization is now " + "auto-computed from data. Use zeta_omega to override unit weight " + "regularization.", + DeprecationWarning, + stacklevel=2, + ) + if zeta is not None: + warnings.warn( + "zeta is deprecated and ignored. 
Use zeta_lambda to override " + "time weight regularization.", + DeprecationWarning, + stacklevel=2, + ) + super().__init__(robust=True, cluster=None, alpha=alpha) - self.lambda_reg = lambda_reg - self.zeta = zeta + self.zeta_omega = zeta_omega + self.zeta_lambda = zeta_lambda self.variance_method = variance_method self.n_bootstrap = n_bootstrap self.seed = seed @@ -270,21 +291,36 @@ def fit( # type: ignore[override] pre_periods, post_periods, treated_units, control_units ) - # Compute unit weights (synthetic control weights) - # Average treated outcomes across treated units + # Compute auto-regularization (or use user overrides) + auto_zeta_omega, auto_zeta_lambda = _compute_regularization( + Y_pre_control, len(treated_units), len(post_periods) + ) + zeta_omega = self.zeta_omega if self.zeta_omega is not None else auto_zeta_omega + zeta_lambda = self.zeta_lambda if self.zeta_lambda is not None else auto_zeta_lambda + + # Store noise level for diagnostics + from diff_diff.utils import _compute_noise_level + noise_level = _compute_noise_level(Y_pre_control) + + # Data-dependent convergence threshold (matches R's 1e-5 * noise.level) + min_decrease = 1e-5 * noise_level if noise_level > 0 else 1e-5 + + # Compute unit weights (Frank-Wolfe with sparsification) Y_pre_treated_mean = np.mean(Y_pre_treated, axis=1) - unit_weights = compute_synthetic_weights( + unit_weights = compute_sdid_unit_weights( Y_pre_control, Y_pre_treated_mean, - lambda_reg=self.lambda_reg + zeta_omega=zeta_omega, + min_decrease=min_decrease, ) - # Compute time weights + # Compute time weights (Frank-Wolfe on collapsed form) time_weights = compute_time_weights( Y_pre_control, - Y_pre_treated_mean, - zeta=self.zeta + Y_post_control, + zeta_lambda=zeta_lambda, + min_decrease=min_decrease, ) # Compute SDID estimate @@ -306,8 +342,9 @@ def fit( # type: ignore[override] # Compute standard errors based on variance_method if self.variance_method == "bootstrap": se, bootstrap_estimates = self._bootstrap_se( 
- working_data, outcome, unit, time, - pre_periods, post_periods, treated_units, control_units + Y_pre_control, Y_post_control, + Y_pre_treated, Y_post_treated, + unit_weights, time_weights, ) placebo_effects = bootstrap_estimates inference_method = "bootstrap" @@ -321,6 +358,9 @@ def fit( # type: ignore[override] unit_weights, time_weights, n_treated=len(treated_units), + zeta_omega=zeta_omega, + zeta_lambda=zeta_lambda, + min_decrease=min_decrease, replications=self.n_bootstrap # Reuse n_bootstrap for replications ) inference_method = "placebo" @@ -336,11 +376,14 @@ def fit( # type: ignore[override] else: p_value = compute_p_value(t_stat) else: - t_stat = 0.0 - p_value = 1.0 + t_stat = np.nan + p_value = np.nan # Confidence interval - conf_int = compute_confidence_interval(att, se, self.alpha) + if se > 0: + conf_int = compute_confidence_interval(att, se, self.alpha) + else: + conf_int = (np.nan, np.nan) # Create weight dictionaries unit_weights_dict = { @@ -366,7 +409,9 @@ def fit( # type: ignore[override] post_periods=post_periods, alpha=self.alpha, variance_method=inference_method, - lambda_reg=self.lambda_reg, + noise_level=noise_level, + zeta_omega=zeta_omega, + zeta_lambda=zeta_lambda, pre_treatment_fit=pre_fit_rmse, placebo_effects=placebo_effects if len(placebo_effects) > 0 else None, n_bootstrap=self.n_bootstrap if inference_method == "bootstrap" else None @@ -455,78 +500,132 @@ def _residualize_covariates( def _bootstrap_se( self, - data: pd.DataFrame, - outcome: str, - unit: str, - time: str, - pre_periods: List[Any], - post_periods: List[Any], - treated_units: List[Any], - control_units: List[Any] + Y_pre_control: np.ndarray, + Y_post_control: np.ndarray, + Y_pre_treated: np.ndarray, + Y_post_treated: np.ndarray, + unit_weights: np.ndarray, + time_weights: np.ndarray, ) -> Tuple[float, np.ndarray]: - """ - Compute bootstrap standard error. + """Compute bootstrap standard error matching R's synthdid bootstrap_sample. 
+ + Resamples all units (control + treated) with replacement, renormalizes + original unit weights for the resampled controls, and computes the + SDID estimator with **fixed** weights (no re-estimation). - Uses block bootstrap at the unit level. + This matches R's ``synthdid::vcov(method="bootstrap")``. """ rng = np.random.default_rng(self.seed) + n_control = Y_pre_control.shape[1] + n_treated = Y_pre_treated.shape[1] + n_total = n_control + n_treated + + # Build full panel matrix: (n_pre+n_post, n_control+n_treated) + Y_full = np.block([ + [Y_pre_control, Y_pre_treated], + [Y_post_control, Y_post_treated] + ]) + n_pre = Y_pre_control.shape[0] + + # Try Rust parallel implementation for ~6x speedup + from diff_diff._backend import HAS_RUST_BACKEND, _rust_bootstrap_variance_sdid + + if HAS_RUST_BACKEND and _rust_bootstrap_variance_sdid is not None: + # Generate random seed when self.seed is None + rust_seed = self.seed if self.seed is not None else int( + np.random.default_rng(None).integers(0, 2**63) + ) + + se, boot_arr, n_failed = _rust_bootstrap_variance_sdid( + np.ascontiguousarray(Y_pre_control, dtype=np.float64), + np.ascontiguousarray(Y_post_control, dtype=np.float64), + np.ascontiguousarray(Y_pre_treated, dtype=np.float64), + np.ascontiguousarray(Y_post_treated, dtype=np.float64), + np.ascontiguousarray(unit_weights, dtype=np.float64), + np.ascontiguousarray(time_weights, dtype=np.float64), + self.n_bootstrap, rust_seed, + ) + bootstrap_estimates = np.asarray(boot_arr) + n_successful = len(bootstrap_estimates) + failure_rate = 1 - (n_successful / self.n_bootstrap) + + # Apply same warning/error logic as Python path + if n_successful == 0: + raise ValueError( + f"All {self.n_bootstrap} bootstrap iterations failed. 
" + f"This typically occurs when:\n" + f" - Sample size is too small for reliable resampling\n" + f" - Weight matrices are singular or near-singular\n" + f" - Insufficient pre-treatment periods for weight estimation\n" + f" - Too few control units relative to treated units\n" + f"Consider using variance_method='placebo' or increasing " + f"the regularization parameters (zeta_omega, zeta_lambda)." + ) + elif n_successful == 1: + warnings.warn( + f"Only 1/{self.n_bootstrap} bootstrap iteration succeeded. " + f"Standard error cannot be computed reliably (requires at least 2). " + f"Returning SE=0.0. Consider using variance_method='placebo' or " + f"increasing the regularization (zeta_omega, zeta_lambda).", + UserWarning, + stacklevel=2, + ) + return 0.0, bootstrap_estimates + elif failure_rate > 0.05: + warnings.warn( + f"Only {n_successful}/{self.n_bootstrap} bootstrap iterations succeeded " + f"({failure_rate:.1%} failure rate). Standard errors may be unreliable. " + f"This can occur with small samples or insufficient pre-treatment periods.", + UserWarning, + stacklevel=2, + ) - all_units = treated_units + control_units - n_units = len(all_units) + return se, bootstrap_estimates + # Python fallback bootstrap_estimates = [] for _ in range(self.n_bootstrap): - # Sample units with replacement - sampled_units = rng.choice(all_units, size=n_units, replace=True) - - # Create bootstrap sample - boot_data = pd.concat([ - data[data[unit] == u].assign(**{unit: f"{u}_{i}"}) - for i, u in enumerate(sampled_units) - ], ignore_index=True) - - # Identify treated/control in bootstrap sample - boot_treated = [ - f"{u}_{i}" for i, u in enumerate(sampled_units) - if u in treated_units - ] - boot_control = [ - f"{u}_{i}" for i, u in enumerate(sampled_units) - if u in control_units - ] - - if len(boot_treated) == 0 or len(boot_control) == 0: + # Resample ALL units with replacement + boot_idx = rng.choice(n_total, size=n_total, replace=True) + + # Identify which resampled units are 
control vs treated + boot_is_control = boot_idx < n_control + boot_control_idx = boot_idx[boot_is_control] + boot_treated_idx = boot_idx[~boot_is_control] + + # Skip if no control or no treated units in bootstrap sample + if len(boot_control_idx) == 0 or len(boot_treated_idx) == 0: continue try: - # Create matrices - Y_pre_c, Y_post_c, Y_pre_t, Y_post_t = self._create_outcome_matrices( - boot_data, outcome, unit, time, - pre_periods, post_periods, boot_treated, boot_control - ) + # Renormalize original unit weights for the resampled controls + boot_omega = _sum_normalize(unit_weights[boot_control_idx]) - # Compute weights - Y_pre_t_mean = np.mean(Y_pre_t, axis=1) - Y_post_t_mean = np.mean(Y_post_t, axis=1) + # Extract resampled outcome matrices + Y_boot = Y_full[:, boot_idx] + Y_boot_pre_c = Y_boot[:n_pre, boot_is_control] + Y_boot_post_c = Y_boot[n_pre:, boot_is_control] + Y_boot_pre_t = Y_boot[:n_pre, ~boot_is_control] + Y_boot_post_t = Y_boot[n_pre:, ~boot_is_control] - w = compute_synthetic_weights(Y_pre_c, Y_pre_t_mean, self.lambda_reg) - t_w = compute_time_weights(Y_pre_c, Y_pre_t_mean, self.zeta) + # Compute ATT with FIXED weights (do NOT re-estimate) + Y_boot_pre_t_mean = np.mean(Y_boot_pre_t, axis=1) + Y_boot_post_t_mean = np.mean(Y_boot_post_t, axis=1) - # Compute estimate tau = compute_sdid_estimator( - Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, w, t_w + Y_boot_pre_c, Y_boot_post_c, + Y_boot_pre_t_mean, Y_boot_post_t_mean, + boot_omega, time_weights # time_weights = original lambda ) bootstrap_estimates.append(tau) - except (ValueError, LinAlgError, KeyError): - # Skip failed bootstrap iterations (e.g., singular matrices, - # missing data in resampled units, or invalid weight computations) + except (ValueError, LinAlgError): continue bootstrap_estimates = np.array(bootstrap_estimates) - # Check bootstrap success rate and handle failures appropriately + # Check bootstrap success rate and handle failures n_successful = len(bootstrap_estimates) 
failure_rate = 1 - (n_successful / self.n_bootstrap) @@ -538,16 +637,15 @@ def _bootstrap_se( f" - Weight matrices are singular or near-singular\n" f" - Insufficient pre-treatment periods for weight estimation\n" f" - Too few control units relative to treated units\n" - f"Consider using n_bootstrap=0 to disable bootstrap inference " - f"and rely on placebo-based standard errors, or increase " - f"the regularization parameters (lambda_reg, zeta)." + f"Consider using variance_method='placebo' or increasing " + f"the regularization parameters (zeta_omega, zeta_lambda)." ) elif n_successful == 1: warnings.warn( f"Only 1/{self.n_bootstrap} bootstrap iteration succeeded. " f"Standard error cannot be computed reliably (requires at least 2). " - f"Returning SE=0.0. Consider the suggestions above for improving " - f"bootstrap convergence.", + f"Returning SE=0.0. Consider using variance_method='placebo' or " + f"increasing the regularization (zeta_omega, zeta_lambda).", UserWarning, stacklevel=2, ) @@ -556,14 +654,13 @@ def _bootstrap_se( warnings.warn( f"Only {n_successful}/{self.n_bootstrap} bootstrap iterations succeeded " f"({failure_rate:.1%} failure rate). Standard errors may be unreliable. " - f"This can occur with small samples, near-singular weight matrices, " - f"or insufficient pre-treatment periods.", + f"This can occur with small samples or insufficient pre-treatment periods.", UserWarning, stacklevel=2, ) - se = np.std(bootstrap_estimates, ddof=1) + se = float(np.std(bootstrap_estimates, ddof=1)) else: - se = np.std(bootstrap_estimates, ddof=1) + se = float(np.std(bootstrap_estimates, ddof=1)) return se, bootstrap_estimates @@ -576,6 +673,9 @@ def _placebo_variance_se( unit_weights: np.ndarray, time_weights: np.ndarray, n_treated: int, + zeta_omega: float = 0.0, + zeta_lambda: float = 0.0, + min_decrease: float = 1e-5, replications: int = 200 ) -> Tuple[float, np.ndarray]: """ @@ -586,8 +686,10 @@ def _placebo_variance_se( 1. 
Randomly sample N₀ control indices (permutation) 2. Designate last N₁ as pseudo-treated, first (N₀-N₁) as pseudo-controls - 3. Renormalize original unit weights for pseudo-controls - 4. Compute SDID estimate using renormalized weights + 3. Re-estimate both omega and lambda on the permuted data (using + original weights as initialization), matching R's behavior where + ``update.omega=TRUE, update.lambda=TRUE`` are passed via ``opts`` + 4. Compute SDID estimate with re-estimated weights 5. Repeat `replications` times 6. SE = sqrt((r-1)/r) * sd(estimates) @@ -607,6 +709,12 @@ def _placebo_variance_se( Time weights from main estimation, shape (n_pre,). n_treated : int Number of treated units in the original estimation. + zeta_omega : float + Regularization parameter for unit weights (for re-estimation). + zeta_lambda : float + Regularization parameter for time weights (for re-estimation). + min_decrease : float + Convergence threshold for Frank-Wolfe (for re-estimation). replications : int, default=200 Number of placebo replications. 
@@ -637,6 +745,53 @@ def _placebo_variance_se( ) return 0.0, np.array([]) + # Try Rust parallel implementation for ~8x speedup + from diff_diff._backend import HAS_RUST_BACKEND, _rust_placebo_variance_sdid + + if HAS_RUST_BACKEND and _rust_placebo_variance_sdid is not None: + # Generate random seed when self.seed is None (matching Python's non-reproducible behavior) + rust_seed = self.seed if self.seed is not None else int( + np.random.default_rng(None).integers(0, 2**63) + ) + + se, placebo_arr = _rust_placebo_variance_sdid( + np.ascontiguousarray(Y_pre_control, dtype=np.float64), + np.ascontiguousarray(Y_post_control, dtype=np.float64), + np.ascontiguousarray(Y_pre_treated_mean, dtype=np.float64), + np.ascontiguousarray(Y_post_treated_mean, dtype=np.float64), + n_treated, zeta_omega, zeta_lambda, min_decrease, + True, # intercept + 100, # max_iter_pre_sparsify + 10000, # max_iter + replications, rust_seed, + ) + placebo_estimates = np.asarray(placebo_arr) + n_successful = len(placebo_estimates) + + # Apply same warning/error logic as Python path + if n_successful < 2: + warnings.warn( + f"Only {n_successful} placebo replications completed successfully. " + f"Standard error cannot be estimated reliably. " + f"Consider using variance_method='bootstrap' or increasing " + f"the number of control units.", + UserWarning, + stacklevel=3, + ) + return 0.0, placebo_estimates + + failure_rate = 1 - (n_successful / replications) + if failure_rate > 0.05: + warnings.warn( + f"Only {n_successful}/{replications} placebo replications succeeded " + f"({failure_rate:.1%} failure rate). 
Standard errors may be unreliable.", + UserWarning, + stacklevel=3, + ) + + return se, placebo_estimates + + # Python fallback placebo_estimates = [] for _ in range(replications): @@ -648,36 +803,43 @@ def _placebo_variance_se( pseudo_control_idx = perm[:n_pseudo_control] pseudo_treated_idx = perm[n_pseudo_control:] - # Renormalize original weights for pseudo-controls (step 3) - # This keeps the relative importance from the main estimation - pseudo_weights = unit_weights[pseudo_control_idx] - weight_sum = pseudo_weights.sum() - if weight_sum > 0: - pseudo_weights = pseudo_weights / weight_sum - else: - # Fallback to uniform if weights sum to zero - pseudo_weights = np.ones(n_pseudo_control) / n_pseudo_control - - # Get pseudo-treated outcomes (mean across pseudo-treated units) - Y_pre_pseudo_treated = np.mean( + # Get pseudo-control and pseudo-treated outcomes + Y_pre_pseudo_control = Y_pre_control[:, pseudo_control_idx] + Y_post_pseudo_control = Y_post_control[:, pseudo_control_idx] + Y_pre_pseudo_treated_mean = np.mean( Y_pre_control[:, pseudo_treated_idx], axis=1 ) - Y_post_pseudo_treated = np.mean( + Y_post_pseudo_treated_mean = np.mean( Y_post_control[:, pseudo_treated_idx], axis=1 ) - # Get pseudo-control outcomes - Y_pre_pseudo_control = Y_pre_control[:, pseudo_control_idx] - Y_post_pseudo_control = Y_post_control[:, pseudo_control_idx] + # Re-estimate weights on permuted data (matching R's behavior) + # R passes update.omega=TRUE, update.lambda=TRUE via opts, + # using original weights as starting points for FW optimization. 
+ # Unit weights: re-estimate on pseudo-control/pseudo-treated data + pseudo_omega = compute_sdid_unit_weights( + Y_pre_pseudo_control, + Y_pre_pseudo_treated_mean, + zeta_omega=zeta_omega, + min_decrease=min_decrease, + ) + + # Time weights: re-estimate on pseudo-control data + pseudo_lambda = compute_time_weights( + Y_pre_pseudo_control, + Y_post_pseudo_control, + zeta_lambda=zeta_lambda, + min_decrease=min_decrease, + ) # Compute placebo SDID estimate (step 4) tau = compute_sdid_estimator( Y_pre_pseudo_control, Y_post_pseudo_control, - Y_pre_pseudo_treated, - Y_post_pseudo_treated, - pseudo_weights, - time_weights + Y_pre_pseudo_treated_mean, + Y_post_pseudo_treated_mean, + pseudo_omega, + pseudo_lambda ) placebo_estimates.append(tau) @@ -720,8 +882,8 @@ def _placebo_variance_se( def get_params(self) -> Dict[str, Any]: """Get estimator parameters.""" return { - "lambda_reg": self.lambda_reg, - "zeta": self.zeta, + "zeta_omega": self.zeta_omega, + "zeta_lambda": self.zeta_lambda, "alpha": self.alpha, "variance_method": self.variance_method, "n_bootstrap": self.n_bootstrap, @@ -730,8 +892,17 @@ def get_params(self) -> Dict[str, Any]: def set_params(self, **params) -> "SyntheticDiD": """Set estimator parameters.""" + # Deprecated parameter names — emit warning and ignore + _deprecated = {"lambda_reg", "zeta"} for key, value in params.items(): - if hasattr(self, key): + if key in _deprecated: + warnings.warn( + f"{key} is deprecated and ignored. 
Use zeta_omega/zeta_lambda " + f"instead.", + DeprecationWarning, + stacklevel=2, + ) + elif hasattr(self, key): setattr(self, key, value) else: raise ValueError(f"Unknown parameter: {key}") diff --git a/diff_diff/utils.py b/diff_diff/utils.py index 010d0111..71f9d80f 100644 --- a/diff_diff/utils.py +++ b/diff_diff/utils.py @@ -18,6 +18,10 @@ HAS_RUST_BACKEND, _rust_project_simplex, _rust_synthetic_weights, + _rust_sdid_unit_weights, + _rust_compute_time_weights, + _rust_compute_noise_level, + _rust_sc_weight_fw, ) # Numerical constants for optimization algorithms @@ -1147,57 +1151,394 @@ def _project_simplex(v: np.ndarray) -> np.ndarray: return np.asarray(np.maximum(v - theta, 0)) -def compute_time_weights( - Y_control: np.ndarray, - Y_treated: np.ndarray, - zeta: float = 1.0 +# ============================================================================= +# SDID Weight Optimization (Frank-Wolfe, matching R's synthdid) +# ============================================================================= + + +def _sum_normalize(v: np.ndarray) -> np.ndarray: + """Normalize vector to sum to 1. Fallback to uniform if sum is zero. + + Matches R's synthdid ``sum_normalize()`` helper. + """ + s = np.sum(v) + if s > 0: + return v / s + return np.ones(len(v)) / len(v) + + +def _compute_noise_level(Y_pre_control: np.ndarray) -> float: + """Compute noise level from first-differences of control outcomes. + + Matches R's ``sd(apply(Y[1:N0, 1:T0], 1, diff))`` which computes + first-differences across time for each control unit, then takes the + pooled standard deviation. + + Parameters + ---------- + Y_pre_control : np.ndarray + Control unit pre-treatment outcomes, shape (n_pre, n_control). + + Returns + ------- + float + Noise level (standard deviation of first-differences). 
+ """ + if HAS_RUST_BACKEND: + return float(_rust_compute_noise_level(np.ascontiguousarray(Y_pre_control))) + return _compute_noise_level_numpy(Y_pre_control) + + +def _compute_noise_level_numpy(Y_pre_control: np.ndarray) -> float: + """Pure NumPy implementation of noise level computation.""" + if Y_pre_control.shape[0] < 2: + return 0.0 + # R: apply(Y[1:N0, 1:T0], 1, diff) computes diff per row (unit). + # Our matrix is (T, N) so diff along axis=0 gives (T-1, N). + first_diffs = np.diff(Y_pre_control, axis=0) # (T_pre-1, N_co) + if first_diffs.size == 0: + return 0.0 + return float(np.std(first_diffs, ddof=1)) + + +def _compute_regularization( + Y_pre_control: np.ndarray, + n_treated: int, + n_post: int, +) -> tuple: + """Compute auto-regularization parameters matching R's synthdid. + + Parameters + ---------- + Y_pre_control : np.ndarray + Control unit pre-treatment outcomes, shape (n_pre, n_control). + n_treated : int + Number of treated units. + n_post : int + Number of post-treatment periods. + + Returns + ------- + tuple + (zeta_omega, zeta_lambda) regularization parameters. + """ + sigma = _compute_noise_level(Y_pre_control) + eta_omega = (n_treated * n_post) ** 0.25 + eta_lambda = 1e-6 + return eta_omega * sigma, eta_lambda * sigma + + +def _fw_step( + A: np.ndarray, + x: np.ndarray, + b: np.ndarray, + eta: float, ) -> np.ndarray: + """Single Frank-Wolfe step on the simplex. + + Matches R's ``fw.step()`` in synthdid's ``sc.weight.fw()``. + + Parameters + ---------- + A : np.ndarray + Matrix of shape (N, T0). + x : np.ndarray + Current weight vector of shape (T0,). + b : np.ndarray + Target vector of shape (N,). + eta : float + Regularization strength (N * zeta^2). + + Returns + ------- + np.ndarray + Updated weight vector on the simplex. """ - Compute time weights for synthetic DiD. 
+ Ax = A @ x + half_grad = A.T @ (Ax - b) + eta * x + i = int(np.argmin(half_grad)) + d_x = -x.copy() + d_x[i] += 1.0 + if np.allclose(d_x, 0.0): + return x.copy() + d_err = A[:, i] - Ax + denom = d_err @ d_err + eta * (d_x @ d_x) + if denom <= 0: + return x.copy() + step = -(half_grad @ d_x) / denom + step = float(np.clip(step, 0.0, 1.0)) + return x + step * d_x + + +def _sc_weight_fw( + Y: np.ndarray, + zeta: float, + intercept: bool = True, + init_weights: Optional[np.ndarray] = None, + min_decrease: float = 1e-5, + max_iter: int = 10000, +) -> np.ndarray: + """Compute synthetic control weights via Frank-Wolfe optimization. - Time weights emphasize pre-treatment periods where the outcome - is more informative for constructing the synthetic control. - Based on the SDID approach from Arkhangelsky et al. (2021). + Matches R's ``sc.weight.fw()`` from the synthdid package. Solves:: + + min_{lambda on simplex} zeta^2 * ||lambda||^2 + + (1/N) * ||A_centered @ lambda - b_centered||^2 Parameters ---------- - Y_control : np.ndarray - Control unit outcomes of shape (n_pre_periods, n_control_units). - Y_treated : np.ndarray - Treated unit mean outcomes of shape (n_pre_periods,). - zeta : float, default=1.0 - Regularization parameter for time weights. Higher values - give more uniform weights. + Y : np.ndarray + Matrix of shape (N, T0+1). Last column is the target (post-period + mean or treated pre-period mean depending on context). + zeta : float + Regularization strength. + intercept : bool, default True + If True, column-center Y before optimization. + init_weights : np.ndarray, optional + Initial weights. If None, starts with uniform weights. + min_decrease : float, default 1e-5 + Convergence criterion: stop when objective decreases by less than + ``min_decrease**2``. R uses ``1e-5 * noise_level``; the caller + should pass the data-dependent value for best results. + max_iter : int, default 10000 + Maximum number of iterations. Matches R's default. 
Returns ------- np.ndarray - Time weights of shape (n_pre_periods,) that sum to 1. + Weights of shape (T0,) on the simplex. + """ + if HAS_RUST_BACKEND: + return np.asarray(_rust_sc_weight_fw( + np.ascontiguousarray(Y, dtype=np.float64), + zeta, intercept, + np.ascontiguousarray(init_weights, dtype=np.float64) if init_weights is not None else None, + min_decrease, max_iter, + )) + return _sc_weight_fw_numpy(Y, zeta, intercept, init_weights, min_decrease, max_iter) + + +def _sc_weight_fw_numpy( + Y: np.ndarray, + zeta: float, + intercept: bool = True, + init_weights: Optional[np.ndarray] = None, + min_decrease: float = 1e-5, + max_iter: int = 10000, +) -> np.ndarray: + """Pure NumPy implementation of Frank-Wolfe SC weight solver.""" + T0 = Y.shape[1] - 1 + N = Y.shape[0] - Notes - ----- - The time weights help interpolate between DiD (uniform weights) - and synthetic control (weights concentrated on similar periods). + if T0 <= 0: + return np.ones(max(T0, 1)) + + # Column-center if using intercept (matches R's intercept=TRUE default) + if intercept: + Y = Y - Y.mean(axis=0) + + A = Y[:, :T0] + b = Y[:, T0] + eta = N * zeta ** 2 + + if init_weights is not None: + lam = init_weights.copy() + else: + lam = np.ones(T0) / T0 + + vals = np.full(max_iter, np.nan) + for t in range(max_iter): + lam = _fw_step(A, lam, b, eta) + err = Y @ np.append(lam, -1.0) + vals[t] = zeta ** 2 * np.sum(lam ** 2) + np.sum(err ** 2) / N + if t >= 1 and vals[t - 1] - vals[t] < min_decrease ** 2: + break + + return lam + + +def _sparsify(v: np.ndarray) -> np.ndarray: + """Sparsify weight vector by zeroing out small entries. + + Matches R's synthdid ``sparsify_function``: + ``v[v <= max(v)/4] = 0; v = v / sum(v)`` + + Parameters + ---------- + v : np.ndarray + Weight vector. + + Returns + ------- + np.ndarray + Sparsified weight vector summing to 1. 
+ """ + v = v.copy() + max_v = np.max(v) + if max_v <= 0: + return np.ones(len(v)) / len(v) + v[v <= max_v / 4] = 0.0 + return _sum_normalize(v) + + +def compute_time_weights( + Y_pre_control: np.ndarray, + Y_post_control: np.ndarray, + zeta_lambda: float, + intercept: bool = True, + min_decrease: float = 1e-5, + max_iter_pre_sparsify: int = 100, + max_iter: int = 10000, +) -> np.ndarray: + """Compute SDID time weights via Frank-Wolfe optimization. + + Matches R's ``synthdid::sc.weight.fw(Yc[1:N0, ], zeta=zeta.lambda, + intercept=TRUE)`` where ``Yc`` is the collapsed-form matrix. Uses + two-pass optimization with sparsification (same as unit weights), + matching R's default ``sparsify=sparsify_function``. + + Parameters + ---------- + Y_pre_control : np.ndarray + Control outcomes in pre-treatment periods, shape (n_pre, n_control). + Y_post_control : np.ndarray + Control outcomes in post-treatment periods, shape (n_post, n_control). + zeta_lambda : float + Regularization parameter for time weights. + intercept : bool, default True + If True, column-center the optimization matrix. + min_decrease : float, default 1e-5 + Convergence criterion for Frank-Wolfe. R uses ``1e-5 * noise_level``. + max_iter_pre_sparsify : int, default 100 + Iterations for first pass (before sparsification). + max_iter : int, default 10000 + Maximum iterations for second pass (after sparsification). + Matches R's default. + + Returns + ------- + np.ndarray + Time weights of shape (n_pre,) on the simplex. 
""" - n_pre = len(Y_treated) + if HAS_RUST_BACKEND: + return np.asarray(_rust_compute_time_weights( + np.ascontiguousarray(Y_pre_control, dtype=np.float64), + np.ascontiguousarray(Y_post_control, dtype=np.float64), + zeta_lambda, intercept, min_decrease, + max_iter_pre_sparsify, max_iter, + )) + + n_pre = Y_pre_control.shape[0] if n_pre <= 1: - return np.asarray(np.ones(n_pre)) + return np.ones(n_pre) + + # Build collapsed form: (N_co, T_pre + 1), last col = per-control post mean + post_means = np.mean(Y_post_control, axis=0) # (N_co,) + Y_time = np.column_stack([Y_pre_control.T, post_means]) # (N_co, T_pre+1) + + # First pass: limited iterations (matching R's max.iter.pre.sparsify) + lam = _sc_weight_fw( + Y_time, + zeta=zeta_lambda, + intercept=intercept, + min_decrease=min_decrease, + max_iter=max_iter_pre_sparsify, + ) - # Compute mean control outcomes per period - control_means = np.mean(Y_control, axis=1) + # Sparsify: zero out small weights, renormalize (R's sparsify_function) + lam = _sparsify(lam) + + # Second pass: from sparsified initialization (matching R's max.iter) + lam = _sc_weight_fw( + Y_time, + zeta=zeta_lambda, + intercept=intercept, + init_weights=lam, + min_decrease=min_decrease, + max_iter=max_iter, + ) - # Compute differences from treated - diffs = np.abs(Y_treated - control_means) + return lam - # Inverse weighting: periods with smaller differences get higher weight - # Add regularization to prevent extreme weights - inv_diffs = 1.0 / (diffs + zeta * np.std(diffs) + _NUMERICAL_EPS) - # Normalize to sum to 1 - weights = inv_diffs / np.sum(inv_diffs) +def compute_sdid_unit_weights( + Y_pre_control: np.ndarray, + Y_pre_treated_mean: np.ndarray, + zeta_omega: float, + intercept: bool = True, + min_decrease: float = 1e-5, + max_iter_pre_sparsify: int = 100, + max_iter: int = 10000, +) -> np.ndarray: + """Compute SDID unit weights via Frank-Wolfe with two-pass sparsification. 
- return np.asarray(weights) + Matches R's ``synthdid::sc.weight.fw(t(Yc[, 1:T0]), zeta=zeta.omega, + intercept=TRUE)`` followed by the sparsify/re-optimize pass. + + Parameters + ---------- + Y_pre_control : np.ndarray + Control outcomes in pre-treatment periods, shape (n_pre, n_control). + Y_pre_treated_mean : np.ndarray + Mean treated outcomes in pre-treatment periods, shape (n_pre,). + zeta_omega : float + Regularization parameter for unit weights. + intercept : bool, default True + If True, column-center the optimization matrix. + min_decrease : float, default 1e-5 + Convergence criterion for Frank-Wolfe. R uses ``1e-5 * noise_level``. + max_iter_pre_sparsify : int, default 100 + Iterations for first pass (before sparsification). + max_iter : int, default 10000 + Iterations for second pass (after sparsification). Matches R's default. + + Returns + ------- + np.ndarray + Unit weights of shape (n_control,) on the simplex. + """ + n_control = Y_pre_control.shape[1] + + if n_control == 0: + return np.asarray([]) + if n_control == 1: + return np.asarray([1.0]) + + if HAS_RUST_BACKEND: + return np.asarray(_rust_sdid_unit_weights( + np.ascontiguousarray(Y_pre_control, dtype=np.float64), + np.ascontiguousarray(Y_pre_treated_mean, dtype=np.float64), + zeta_omega, intercept, min_decrease, + max_iter_pre_sparsify, max_iter, + )) + + # Build collapsed form: (T_pre, N_co + 1), last col = treated pre means + Y_unit = np.column_stack([Y_pre_control, Y_pre_treated_mean.reshape(-1, 1)]) + + # First pass: limited iterations + omega = _sc_weight_fw( + Y_unit, + zeta=zeta_omega, + intercept=intercept, + max_iter=max_iter_pre_sparsify, + min_decrease=min_decrease, + ) + + # Sparsify: zero out weights <= max/4, renormalize + omega = _sparsify(omega) + + # Second pass: from sparsified initialization + omega = _sc_weight_fw( + Y_unit, + zeta=zeta_omega, + intercept=intercept, + init_weights=omega, + max_iter=max_iter, + min_decrease=min_decrease, + ) + + return omega def 
compute_sdid_estimator(
diff --git a/docs/methodology/REGISTRY.md b/docs/methodology/REGISTRY.md
index 52f5e6a3..b15ebef8 100644
--- a/docs/methodology/REGISTRY.md
+++ b/docs/methodology/REGISTRY.md
@@ -572,42 +572,107 @@ Y_it = alpha_i + beta_t [+ X'_it * delta] + W'_it * gamma + epsilon_it
 τ̂^sdid = Σ_t λ_t (Ȳ_{tr,t} - Σ_j ω_j Y_{j,t})
 ```
-Unit weights ω solve:
+where Ȳ_{tr,t} is the mean treated outcome at time t, ω_j are unit weights, and λ_t are time weights.
+
+*Unit weights ω (Frank-Wolfe on collapsed form):*
+
+Build collapsed-form matrix Y_unit of shape (T_pre, N_co + 1), where the last column is the mean treated pre-period outcomes. Solve via Frank-Wolfe on the simplex:
+
 ```
-min_ω ||Ȳ_{tr,pre} - Σ_j ω_j Y_{j,pre}||₂² + ζ² ||ω||₂²
-s.t. ω ≥ 0, Σ_j ω_j = 1
+min_{ω on simplex} ζ_ω² ||ω||₂² + (1/T_pre) ||A_centered ω - b_centered||₂²
 ```
-Time weights λ solve analogous problem matching pre/post means.
+where A = Y_unit[:, :N_co], b = Y_unit[:, N_co], and centering is column-wise (intercept=True).
+
+**Two-pass sparsification procedure** (matches R's `synthdid::sc.weight.fw` + `sparsify_function`):
+1. First pass: Run Frank-Wolfe for 100 iterations (max_iter_pre_sparsify) from uniform initialization
+2. Sparsify: `v[v <= max(v)/4] = 0; v = v / sum(v)` (zero out small weights, renormalize)
+3. Second pass: Run Frank-Wolfe for 10000 iterations (max_iter) starting from sparsified weights
+
+The sparsification step concentrates weights on the most important control units, improving interpretability and stability.
+
+*Time weights λ (Frank-Wolfe on collapsed form):*
+
+Build collapsed-form matrix Y_time of shape (N_co, T_pre + 1), where the last column is the per-control post-period mean (averaged across post-periods for each control unit). Solve:
-Regularization parameter:
 ```
-ζ = (N_tr × T_post)^(1/4) × σ̂
+min_{λ on simplex} ζ_λ² ||λ||₂² + (1/N_co) ||A_centered λ - b_centered||₂²
 ```
-where σ̂ is estimated noise level.
-*Standard errors:*
-- Default: Placebo variance estimator (Algorithm 4 in paper)
+where A = Y_time[:, :T_pre], b = Y_time[:, T_pre], and centering is column-wise.
+
+*Auto-regularization (matching R's synthdid):*
 ```
-V̂ = ((r-1)/r) × Var({τ̂^(j) : j ∈ controls})
+noise_level = sd(first_differences of control outcomes)  # pooled across units
+zeta_omega = (N_treated × T_post)^(1/4) × noise_level
+zeta_lambda = 1e-6 × noise_level
 ```
-where τ̂^(j) is placebo estimate treating unit j as treated
-- Alternative: Block bootstrap
+
+The noise level is computed as the standard deviation (ddof=1) of `np.diff(Y_pre_control, axis=0)`,
+which computes first-differences across time for each control unit and pools all values.
+This matches R's `sd(apply(Y[1:N0, 1:T0], 1, diff))`.
+
+*Frank-Wolfe step (matches R's `fw.step()`):*
+```
+half_grad = A' (A x - b) + η x        # η = N × ζ²
+i = argmin(half_grad)                 # vertex selection (simplex corner)
+d_x = e_i - x                         # direction toward vertex i
+step = -(half_grad · d_x) / (||A d_x||² + η ||d_x||²)
+step = clip(step, 0, 1)
+x_new = x + step × d_x
+```
+
+Convergence criterion: stop when objective decrease < min_decrease² (default min_decrease=1e-5).
+
+*Standard errors:*
+
+- Default: Placebo variance estimator (Algorithm 4 in paper)
+  1. Randomly permute control unit indices
+  2. Split into pseudo-controls (first N_co - N_tr) and pseudo-treated (last N_tr)
+  3. Re-estimate both ω and λ on the permuted data via Frank-Wolfe (matching R's `update.omega=TRUE, update.lambda=TRUE`)
+  4. Compute SDID estimate with the re-estimated weights
+  5. Repeat `replications` times (default 200)
+  6. `SE = sqrt((r-1)/r) × sd(placebo_estimates)` where r = number of successful replications
+
+  This matches R's `synthdid::vcov(method="placebo")`.
+
+- Alternative: Bootstrap at unit level (matching R's `synthdid::vcov(method="bootstrap")`)
+  1. Resample ALL units (control + treated) with replacement
+  2.
Identify which resampled units are control vs treated + 3. Renormalize original unit weights for resampled controls: `ω_boot = _sum_normalize(ω[boot_control_idx])` + 4. Time weights λ remain **unchanged** from original estimation (fixed weights) + 5. Compute SDID estimate with renormalized ω and original λ + 6. `SE = sd(bootstrap_estimates, ddof=1)` *Edge cases:* -- Negative weights attempted: projected onto simplex -- Perfect pre-treatment fit: regularization prevents overfitting -- Single treated unit: valid, uses jackknife-style variance +- **Frank-Wolfe non-convergence**: Returns current weights after max_iter iterations. No warning emitted; the convergence check `vals[t-1] - vals[t] < min_decrease²` simply does not trigger early exit, and the final iterate is returned. +- **`_sparsify` all-zero input**: If `max(v) <= 0`, returns uniform weights `ones(len(v)) / len(v)`. +- **Single control unit**: `compute_sdid_unit_weights` returns `[1.0]` immediately (short-circuit before Frank-Wolfe). +- **Zero control units**: `compute_sdid_unit_weights` returns empty array `[]`. +- **Single pre-period**: `compute_time_weights` returns `[1.0]` when `n_pre <= 1` (Frank-Wolfe on a 1-element simplex is trivial). +- **Bootstrap with 0 control or 0 treated in resample**: Skip iteration (`continue`). If ALL bootstrap iterations fail, raises `ValueError`. If only 1 succeeds, warns and returns SE=0.0. If >5% failure rate, warns about reliability. +- **Placebo with n_control <= n_treated**: Warns that not enough control units for placebo variance estimation, returns SE=0.0 and empty placebo effects array. The check is `n_control - n_treated < 1`. +- **Negative weights attempted**: Frank-Wolfe operates on the simplex (non-negative, sum-to-1), so weights are always feasible by construction. The step size is clipped to [0, 1] and the move is toward a simplex vertex. +- **Perfect pre-treatment fit**: Regularization (ζ² ||ω||²) prevents overfitting by penalizing weight concentration. 
+- **Single treated unit**: Valid; placebo variance uses jackknife-style permutations of controls.
+- **Noise level with < 2 pre-periods**: Returns 0.0, which makes both zeta_omega and zeta_lambda equal to 0.0 (no regularization).
+- **NaN inference for undefined statistics**: t_stat uses NaN when SE is zero or non-finite; p_value and CI also NaN. Matches CallawaySantAnna NaN convention.
+- **Placebo p-value floor**: `p_value = max(empirical_p, 1/(n_replications + 1))` to avoid reporting exactly zero.
 
 **Reference implementation(s):**
 - R: `synthdid::synthdid_estimate()` (Arkhangelsky et al.'s official package)
+- Key R functions matched: `sc.weight.fw()` (Frank-Wolfe), `sparsify_function` (sparsification), `vcov.synthdid_estimate()` (variance)
 
 **Requirements checklist:**
-- [ ] Unit weights: sum to 1, non-negative (simplex constraint)
-- [ ] Time weights: sum to 1, non-negative (simplex constraint)
-- [ ] Placebo SE formula: `sqrt((r-1)/r) * sd(placebo_estimates)`
-- [ ] Regularization scales with panel dimensions
-- [ ] Returns both unit and time weights for interpretation
+- [x] Unit weights: Frank-Wolfe on collapsed form (T_pre, N_co+1), two-pass sparsification (100 iters -> sparsify -> 10000 iters)
+- [x] Time weights: Frank-Wolfe on collapsed form (N_co, T_pre+1), last column = per-control post mean
+- [x] Unit and time weights: sum to 1, non-negative (simplex constraint)
+- [x] Auto-regularization: noise_level = sd(first_diffs), zeta_omega = (N1*T1)^0.25 * noise_level, zeta_lambda = 1e-6 * noise_level
+- [x] Sparsification: v[v <= max(v)/4] = 0; v = v/sum(v)
+- [x] Placebo SE formula: sqrt((r-1)/r) * sd(placebo_estimates)
+- [x] Bootstrap: fixed weights (original lambda unchanged, omega renormalized for resampled controls)
+- [x] Returns both unit and time weights for interpretation
+- [x] Column centering (intercept=True) in Frank-Wolfe optimization
 
 ---
 
@@ -1182,7 +1247,7 @@ should be a deliberate user choice.
| CallawaySantAnna | Analytical (influence fn) | Multiplier bootstrap | | SunAbraham | Cluster-robust + delta method | Pairs bootstrap | | ImputationDiD | Conservative clustered (Thm 3) | Multiplier bootstrap (library extension; percentile CIs and empirical p-values, consistent with CS/SA) | -| SyntheticDiD | Placebo variance (Alg 4) | Block bootstrap | +| SyntheticDiD | Placebo variance (Alg 4) | Unit-level bootstrap (fixed weights) | | TripleDifference | HC1 / cluster-robust | Influence function for IPW/DR | | TROP | Block bootstrap | — | | BaconDecomposition | N/A (exact decomposition) | Individual 2×2 SEs | diff --git a/docs/tutorials/03_synthetic_did.ipynb b/docs/tutorials/03_synthetic_did.ipynb index b5833e56..8c7c22ce 100644 --- a/docs/tutorials/03_synthetic_did.ipynb +++ b/docs/tutorials/03_synthetic_did.ipynb @@ -389,14 +389,7 @@ { "cell_type": "markdown", "metadata": {}, - "source": [ - "## 7. Inference Methods\n", - "\n", - "SDID supports two inference methods:\n", - "\n", - "1. **Bootstrap** (`variance_method=\"bootstrap\"`): Block bootstrap at unit level (default)\n", - "2. **Placebo** (`variance_method=\"placebo\"`): Placebo-based variance using Algorithm 4 from Arkhangelsky et al. (2021)" - ] + "source": "## 7. Inference Methods\n\nSDID supports two inference methods:\n\n1. **Placebo** (`variance_method=\"placebo\"`, default): Placebo-based variance using Algorithm 4 from Arkhangelsky et al. (2021). This matches R's default.\n2. **Bootstrap** (`variance_method=\"bootstrap\"`): Unit-level bootstrap with fixed weights matching R's `bootstrap_sample`" }, { "cell_type": "code", @@ -453,56 +446,14 @@ { "cell_type": "markdown", "metadata": {}, - "source": [ - "## 8. Tuning Regularization\n", - "\n", - "SDID has two regularization parameters:\n", - "\n", - "- `lambda_reg`: Regularization for unit weights (higher = more uniform)\n", - "- `zeta`: Regularization for time weights (higher = more uniform)" - ] + "source": "## 8. 
Tuning Regularization\n\nBy default, SDID **auto-computes** regularization from the data noise level, matching R's `synthdid` package:\n\n- `zeta_omega`: Unit weight regularization = `(N1 * T1)^0.25 * noise_level`\n- `zeta_lambda`: Time weight regularization = `1e-6 * noise_level`\n\nYou can override these with explicit values:" }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], - "source": [ - "# Compare different regularization levels\n", - "results_list = []\n", - "\n", - "for lambda_reg in [0.0, 1.0, 10.0]:\n", - " sdid_reg = SyntheticDiD(\n", - " lambda_reg=lambda_reg,\n", - " variance_method=\"placebo\",\n", - " n_bootstrap=200,\n", - " seed=42\n", - " )\n", - " \n", - " res = sdid_reg.fit(\n", - " df,\n", - " outcome=\"outcome\",\n", - " treatment=\"treated\",\n", - " unit=\"unit\",\n", - " time=\"period\",\n", - " post_periods=list(range(n_pre, n_periods))\n", - " )\n", - " \n", - " weights = list(res.unit_weights.values())\n", - " eff_n = 1 / sum(w**2 for w in weights) if sum(w**2 for w in weights) > 0 else 0\n", - " \n", - " results_list.append({\n", - " 'lambda_reg': lambda_reg,\n", - " 'ATT': res.att,\n", - " 'SE': res.se,\n", - " 'Eff. 
N controls': eff_n,\n", - " 'Pre-fit RMSE': res.pre_treatment_fit\n", - " })\n", - "\n", - "reg_df = pd.DataFrame(results_list)\n", - "print(\"Effect of unit weight regularization:\")\n", - "print(reg_df.to_string(index=False))" - ] + "source": "# Compare different unit weight regularization levels\nresults_list = []\n\nfor zeta_omega in [0.01, 1.0, 100.0]:\n sdid_reg = SyntheticDiD(\n zeta_omega=zeta_omega,\n variance_method=\"placebo\",\n n_bootstrap=200,\n seed=42\n )\n \n res = sdid_reg.fit(\n df,\n outcome=\"outcome\",\n treatment=\"treated\",\n unit=\"unit\",\n time=\"period\",\n post_periods=list(range(n_pre, n_periods))\n )\n \n weights = list(res.unit_weights.values())\n eff_n = 1 / sum(w**2 for w in weights) if sum(w**2 for w in weights) > 0 else 0\n \n results_list.append({\n 'zeta_omega': zeta_omega,\n 'ATT': res.att,\n 'SE': res.se,\n 'Eff. N controls': eff_n,\n 'Pre-fit RMSE': res.pre_treatment_fit\n })\n\nreg_df = pd.DataFrame(results_list)\nprint(\"Effect of unit weight regularization:\")\nprint(reg_df.to_string(index=False))" }, { "cell_type": "markdown", @@ -595,23 +546,7 @@ { "cell_type": "markdown", "metadata": {}, - "source": [ - "## Summary\n", - "\n", - "Key takeaways for Synthetic DiD:\n", - "\n", - "1. **Best use cases**: Few treated units, many controls, long pre-period\n", - "2. **Unit weights**: Identify which controls are most similar to treated\n", - "3. **Time weights**: Determine which pre-periods are most informative\n", - "4. **Pre-treatment fit**: Lower RMSE indicates better synthetic match\n", - "5. **Inference options**:\n", - " - Bootstrap (`variance_method=\"bootstrap\"`): Block bootstrap at unit level (default)\n", - " - Placebo (`variance_method=\"placebo\"`): Placebo-based variance from controls\n", - "6. **Regularization**: Higher values give more uniform weights\n", - "\n", - "Reference:\n", - "- Arkhangelsky, D., Athey, S., Hirshberg, D. A., Imbens, G. W., & Wager, S. (2021). Synthetic difference-in-differences. 
American Economic Review, 111(12), 4088-4118." - ] + "source": "## Summary\n\nKey takeaways for Synthetic DiD:\n\n1. **Best use cases**: Few treated units, many controls, long pre-period\n2. **Unit weights**: Identify which controls are most similar to treated (Frank-Wolfe with sparsification)\n3. **Time weights**: Determine which pre-periods are most informative (Frank-Wolfe on collapsed form)\n4. **Pre-treatment fit**: Lower RMSE indicates better synthetic match\n5. **Inference options**:\n - Placebo (`variance_method=\"placebo\"`, default): Placebo-based variance from controls (matches R)\n - Bootstrap (`variance_method=\"bootstrap\"`): Unit-level bootstrap with fixed weights\n6. **Regularization**: Auto-computed from data noise level by default. Override with `zeta_omega`/`zeta_lambda`.\n\nReference:\n- Arkhangelsky, D., Athey, S., Hirshberg, D. A., Imbens, G. W., & Wager, S. (2021). Synthetic difference-in-differences. American Economic Review, 111(12), 4088-4118." } ], "metadata": { @@ -621,4 +556,4 @@ }, "nbformat": 4, "nbformat_minor": 4 -} +} \ No newline at end of file diff --git a/rust/src/lib.rs b/rust/src/lib.rs index e4ed7df8..e7c232c1 100644 --- a/rust/src/lib.rs +++ b/rust/src/lib.rs @@ -7,6 +7,7 @@ use pyo3::prelude::*; mod bootstrap; mod linalg; +mod sdid_variance; mod trop; mod weights; @@ -19,10 +20,16 @@ fn _rust_backend(m: &Bound<'_, PyModule>) -> PyResult<()> { m )?)?; - // Synthetic control weights + // Synthetic control weights (legacy projected gradient descent) m.add_function(wrap_pyfunction!(weights::compute_synthetic_weights, m)?)?; m.add_function(wrap_pyfunction!(weights::project_simplex, m)?)?; + // SDID weights (Frank-Wolfe matching R's synthdid) + m.add_function(wrap_pyfunction!(weights::compute_sdid_unit_weights, m)?)?; + m.add_function(wrap_pyfunction!(weights::compute_time_weights, m)?)?; + m.add_function(wrap_pyfunction!(weights::compute_noise_level, m)?)?; + m.add_function(wrap_pyfunction!(weights::sc_weight_fw, m)?)?; + // 
Linear algebra operations
     m.add_function(wrap_pyfunction!(linalg::solve_ols, m)?)?;
     m.add_function(wrap_pyfunction!(linalg::compute_robust_vcov, m)?)?;
@@ -36,6 +43,10 @@ fn _rust_backend(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_function(wrap_pyfunction!(trop::loocv_grid_search_joint, m)?)?;
     m.add_function(wrap_pyfunction!(trop::bootstrap_trop_variance_joint, m)?)?;
 
+    // SDID variance estimation (parallel placebo and bootstrap)
+    m.add_function(wrap_pyfunction!(sdid_variance::placebo_variance_sdid, m)?)?;
+    m.add_function(wrap_pyfunction!(sdid_variance::bootstrap_variance_sdid, m)?)?;
+
     // Version info
     m.add("__version__", env!("CARGO_PKG_VERSION"))?;
 
diff --git a/rust/src/sdid_variance.rs b/rust/src/sdid_variance.rs
new file mode 100644
index 00000000..c08bdd7a
--- /dev/null
+++ b/rust/src/sdid_variance.rs
@@ -0,0 +1,496 @@
+//! SDID variance estimation acceleration.
+//!
+//! This module provides parallelized implementations of:
+//! - Placebo-based variance estimation (Algorithm 4, Arkhangelsky et al. 2021)
+//! - Bootstrap variance estimation with fixed weights
+//!
+//! Both functions parallelize across replications using rayon, providing
+//! near-linear speedup on multi-core machines (e.g., ~8x on 8 cores).
+//!
+//! Reference:
+//! Arkhangelsky, D., Athey, S., Hirshberg, D. A., Imbens, G. W., & Wager, S.
+//! (2021). Synthetic Difference-in-Differences. American Economic Review,
+//! 111(12), 4088-4118.
+
+use ndarray::{Array1, Array2, Axis};
+use numpy::{PyArray1, PyReadonlyArray1, PyReadonlyArray2, ToPyArray};
+use pyo3::prelude::*;
+use rayon::prelude::*;
+
+use crate::weights;
+
+/// Fisher-Yates permutation of 0..n using the provided RNG.
+fn fisher_yates_permutation(rng: &mut impl rand::Rng, n: usize) -> Vec<usize> {
+    let mut perm: Vec<usize> = (0..n).collect();
+    for i in (1..n).rev() {
+        let j = rng.gen_range(0..=i);
+        perm.swap(i, j);
+    }
+    perm
+}
+
+/// Extract columns from a matrix by index.
+fn extract_submatrix_cols(matrix: &Array2<f64>, col_indices: &[usize]) -> Array2<f64> {
+    let n_rows = matrix.nrows();
+    let n_cols = col_indices.len();
+    let mut result = Array2::zeros((n_rows, n_cols));
+    for (new_j, &old_j) in col_indices.iter().enumerate() {
+        for i in 0..n_rows {
+            result[[i, new_j]] = matrix[[i, old_j]];
+        }
+    }
+    result
+}
+
+/// Compute column means for selected columns.
+fn column_means(matrix: &Array2<f64>, col_indices: &[usize]) -> Array1<f64> {
+    let n_rows = matrix.nrows();
+    let n_cols = col_indices.len();
+    if n_cols == 0 {
+        return Array1::zeros(n_rows);
+    }
+    let mut means = Array1::zeros(n_rows);
+    for &j in col_indices {
+        for i in 0..n_rows {
+            means[i] += matrix[[i, j]];
+        }
+    }
+    means /= n_cols as f64;
+    means
+}
+
+/// Compute the SDID estimator (ATT) from pre/post control/treated data and weights.
+///
+/// Matches `compute_sdid_estimator` in Python's `utils.py:1587-1604`:
+///
+///   τ̂ = (Ȳ_treated,post - Σ_t λ_t * Y_treated,t)
+///      - Σ_j ω_j * (Ȳ_j,post - Σ_t λ_t * Y_j,t)
+fn sdid_estimator_internal(
+    y_pre_control: &Array2<f64>,
+    y_post_control: &Array2<f64>,
+    y_pre_treated_mean: &Array1<f64>,
+    y_post_treated_mean: &Array1<f64>,
+    unit_weights: &Array1<f64>,
+    time_weights: &Array1<f64>,
+) -> f64 {
+    // Weighted pre-treatment averages
+    // time_weights @ Y_pre_control -> (n_control,)
+    let weighted_pre_control = time_weights.dot(&y_pre_control.view());
+    // time_weights @ Y_pre_treated_mean -> scalar
+    let weighted_pre_treated = time_weights.dot(y_pre_treated_mean);
+
+    // Post-treatment averages
+    let mean_post_control = y_post_control.mean_axis(Axis(0)).unwrap();
+    let mean_post_treated = y_post_treated_mean.mean().unwrap();
+
+    // DiD for treated: post - weighted pre
+    let did_treated = mean_post_treated - weighted_pre_treated;
+
+    // Weighted DiD for controls: sum over j of omega_j * (post_j - weighted_pre_j)
+    let diff_control = &mean_post_control - &weighted_pre_control;
+    let did_control = unit_weights.dot(&diff_control);
+
+    // SDID estimator
+    did_treated - did_control
+}
+
+/// Compute placebo-based variance for SDID in parallel.
+///
+/// Implements Algorithm 4 from Arkhangelsky et al. (2021), matching R's
+/// `synthdid::vcov(method = "placebo")`:
+///
+/// 1. Randomly permute control indices
+/// 2. Split into pseudo-controls and pseudo-treated
+/// 3. Re-estimate both omega and lambda on the permuted data
+/// 4. Compute SDID estimate with re-estimated weights
+/// 5. Repeat `replications` times (in parallel)
+/// 6. SE = sqrt((r-1)/r) * sd(estimates)
+///
+/// # Arguments
+/// * `y_pre_control` - Control outcomes in pre-treatment periods (n_pre, n_control)
+/// * `y_post_control` - Control outcomes in post-treatment periods (n_post, n_control)
+/// * `y_pre_treated_mean` - Mean treated outcomes in pre-treatment (n_pre,)
+/// * `y_post_treated_mean` - Mean treated outcomes in post-treatment (n_post,)
+/// * `n_treated` - Number of treated units in the original estimation
+/// * `zeta_omega` - Regularization parameter for unit weights
+/// * `zeta_lambda` - Regularization parameter for time weights
+/// * `min_decrease` - Convergence threshold for Frank-Wolfe
+/// * `intercept` - Column-center if true (default: true)
+/// * `max_iter_pre_sparsify` - Iterations for first pass (default: 100)
+/// * `max_iter` - Iterations for second pass (default: 10000)
+/// * `replications` - Number of placebo replications
+/// * `seed` - Random seed for reproducibility
+///
+/// # Returns
+/// (se, placebo_estimates) where se is the standard error and
+/// placebo_estimates is the array of successful placebo effects.
+#[pyfunction]
+#[pyo3(signature = (y_pre_control, y_post_control, y_pre_treated_mean, y_post_treated_mean,
+                    n_treated, zeta_omega, zeta_lambda, min_decrease,
+                    intercept=true, max_iter_pre_sparsify=100, max_iter=10000,
+                    replications=200, seed=42))]
+#[allow(clippy::too_many_arguments)]
+pub fn placebo_variance_sdid<'py>(
+    py: Python<'py>,
+    y_pre_control: PyReadonlyArray2<'py, f64>,
+    y_post_control: PyReadonlyArray2<'py, f64>,
+    y_pre_treated_mean: PyReadonlyArray1<'py, f64>,
+    y_post_treated_mean: PyReadonlyArray1<'py, f64>,
+    n_treated: usize,
+    zeta_omega: f64,
+    zeta_lambda: f64,
+    min_decrease: f64,
+    intercept: bool,
+    max_iter_pre_sparsify: usize,
+    max_iter: usize,
+    replications: usize,
+    seed: u64,
+) -> PyResult<(f64, Bound<'py, PyArray1<f64>>)> {
+    // Convert to owned arrays for Send across threads
+    let y_pre_c = y_pre_control.as_array().to_owned();
+    let y_post_c = y_post_control.as_array().to_owned();
+    let _y_pre_t_mean = y_pre_treated_mean.as_array().to_owned();
+    let _y_post_t_mean = y_post_treated_mean.as_array().to_owned();
+
+    let n_control = y_pre_c.ncols();
+
+    // Check if we have enough controls for the split
+    let n_pseudo_control = n_control.saturating_sub(n_treated);
+    if n_pseudo_control < 1 {
+        let empty = Array1::<f64>::zeros(0);
+        return Ok((0.0, empty.to_pyarray_bound(py)));
+    }
+
+    // Parallel loop over replications
+    let placebo_estimates: Vec<f64> = (0..replications)
+        .into_par_iter()
+        .filter_map(|b| {
+            use rand::prelude::*;
+            use rand_xoshiro::Xoshiro256PlusPlus;
+
+            let mut rng = Xoshiro256PlusPlus::seed_from_u64(seed.wrapping_add(b as u64));
+
+            // Generate random permutation of control indices
+            let perm = fisher_yates_permutation(&mut rng, n_control);
+
+            // Split into pseudo-controls and pseudo-treated
+            let pseudo_control_idx = &perm[..n_pseudo_control];
+            let pseudo_treated_idx = &perm[n_pseudo_control..];
+
+            // Extract submatrices
+            let y_pre_pseudo_control = extract_submatrix_cols(&y_pre_c, pseudo_control_idx);
+            let y_post_pseudo_control = extract_submatrix_cols(&y_post_c, pseudo_control_idx);
+            let y_pre_pseudo_treated_mean = column_means(&y_pre_c, pseudo_treated_idx);
+            let y_post_pseudo_treated_mean = column_means(&y_post_c, pseudo_treated_idx);
+
+            // Re-estimate unit weights on permuted data
+            let pseudo_omega = weights::compute_sdid_unit_weights_internal(
+                &y_pre_pseudo_control.view(),
+                &y_pre_pseudo_treated_mean.view(),
+                zeta_omega,
+                intercept,
+                min_decrease,
+                max_iter_pre_sparsify,
+                max_iter,
+            );
+
+            // Re-estimate time weights on permuted data
+            let pseudo_lambda = weights::compute_time_weights_internal(
+                &y_pre_pseudo_control.view(),
+                &y_post_pseudo_control.view(),
+                zeta_lambda,
+                intercept,
+                min_decrease,
+                max_iter_pre_sparsify,
+                max_iter,
+            );
+
+            // Compute placebo SDID estimate
+            let tau = sdid_estimator_internal(
+                &y_pre_pseudo_control,
+                &y_post_pseudo_control,
+                &y_pre_pseudo_treated_mean,
+                &y_post_pseudo_treated_mean,
+                &pseudo_omega,
+                &pseudo_lambda,
+            );
+
+            if tau.is_finite() {
+                Some(tau)
+            } else {
+                None
+            }
+        })
+        .collect();
+
+    let n_successful = placebo_estimates.len();
+
+    // Compute SE: sqrt((r-1)/r) * sd(estimates, ddof=1) matching R's formula
+    let se = if n_successful < 2 {
+        0.0
+    } else {
+        let n = n_successful as f64;
+        let mean = placebo_estimates.iter().sum::<f64>() / n;
+        let variance = placebo_estimates
+            .iter()
+            .map(|x| (x - mean).powi(2))
+            .sum::<f64>()
+            / (n - 1.0);
+        ((n - 1.0) / n).sqrt() * variance.sqrt()
+    };
+
+    let estimates_arr = Array1::from_vec(placebo_estimates);
+    Ok((se, estimates_arr.to_pyarray_bound(py)))
+}
+
+/// Compute bootstrap variance for SDID in parallel.
+///
+/// Resamples all units (control + treated) with replacement, renormalizes
+/// original unit weights for the resampled controls, and computes the
+/// SDID estimator with **fixed** weights (no re-estimation).
+///
+/// This matches R's `synthdid::vcov(method="bootstrap")`.
+///
+/// # Arguments
+/// * `y_pre_control` - Control outcomes in pre-treatment (n_pre, n_control)
+/// * `y_post_control` - Control outcomes in post-treatment (n_post, n_control)
+/// * `y_pre_treated` - Treated outcomes in pre-treatment (n_pre, n_treated)
+/// * `y_post_treated` - Treated outcomes in post-treatment (n_post, n_treated)
+/// * `unit_weights` - Original unit weights (n_control,)
+/// * `time_weights` - Original time weights (n_pre,)
+/// * `n_bootstrap` - Number of bootstrap iterations
+/// * `seed` - Random seed
+///
+/// # Returns
+/// (se, bootstrap_estimates, n_failed)
+#[pyfunction]
+#[pyo3(signature = (y_pre_control, y_post_control, y_pre_treated, y_post_treated,
+                    unit_weights, time_weights, n_bootstrap, seed))]
+#[allow(clippy::too_many_arguments)]
+pub fn bootstrap_variance_sdid<'py>(
+    py: Python<'py>,
+    y_pre_control: PyReadonlyArray2<'py, f64>,
+    y_post_control: PyReadonlyArray2<'py, f64>,
+    y_pre_treated: PyReadonlyArray2<'py, f64>,
+    y_post_treated: PyReadonlyArray2<'py, f64>,
+    unit_weights: PyReadonlyArray1<'py, f64>,
+    time_weights: PyReadonlyArray1<'py, f64>,
+    n_bootstrap: usize,
+    seed: u64,
+) -> PyResult<(f64, Bound<'py, PyArray1<f64>>, usize)> {
+    // Convert to owned arrays for Send across threads
+    let y_pre_c = y_pre_control.as_array().to_owned();
+    let y_post_c = y_post_control.as_array().to_owned();
+    let y_pre_t = y_pre_treated.as_array().to_owned();
+    let y_post_t = y_post_treated.as_array().to_owned();
+    let omega = unit_weights.as_array().to_owned();
+    let lambda = time_weights.as_array().to_owned();
+
+    let n_control = y_pre_c.ncols();
+    let n_treated = y_pre_t.ncols();
+    let n_total = n_control + n_treated;
+    let n_pre = y_pre_c.nrows();
+
+    // Build full panel: (n_pre+n_post, n_control+n_treated)
+    let n_post = y_post_c.nrows();
+    let n_times = n_pre + n_post;
+    let mut y_full = Array2::zeros((n_times, n_total));
+    for t in 0..n_pre {
+        for j in 0..n_control {
+            y_full[[t, j]] = y_pre_c[[t, j]];
+        }
+        for j in 0..n_treated {
+            y_full[[t, n_control + j]] = y_pre_t[[t, j]];
+        }
+    }
+    for t in 0..n_post {
+        for j in 0..n_control {
+            y_full[[n_pre + t, j]] = y_post_c[[t, j]];
+        }
+        for j in 0..n_treated {
+            y_full[[n_pre + t, n_control + j]] = y_post_t[[t, j]];
+        }
+    }
+
+    // Parallel bootstrap loop
+    let bootstrap_estimates: Vec<f64> = (0..n_bootstrap)
+        .into_par_iter()
+        .filter_map(|b| {
+            use rand::prelude::*;
+            use rand_xoshiro::Xoshiro256PlusPlus;
+
+            let mut rng = Xoshiro256PlusPlus::seed_from_u64(seed.wrapping_add(b as u64));
+
+            // Resample all units with replacement
+            let boot_idx: Vec<usize> = (0..n_total)
+                .map(|_| rng.gen_range(0..n_total))
+                .collect();
+
+            // Identify control vs treated in resampled set
+            let mut boot_control_idx = Vec::new();
+            let mut boot_treated_idx = Vec::new();
+            for &idx in &boot_idx {
+                if idx < n_control {
+                    boot_control_idx.push(idx);
+                } else {
+                    boot_treated_idx.push(idx);
+                }
+            }
+
+            // Skip degenerate samples
+            if boot_control_idx.is_empty() || boot_treated_idx.is_empty() {
+                return None;
+            }
+
+            // Renormalize unit weights for resampled controls
+            let boot_omega_raw: Array1<f64> =
+                Array1::from_iter(boot_control_idx.iter().map(|&i| omega[i]));
+            let boot_omega = weights::sum_normalize_internal(&boot_omega_raw);
+
+            let n_boot_control = boot_control_idx.len();
+            let n_boot_treated = boot_treated_idx.len();
+
+            // Extract resampled submatrices
+            let mut y_boot_pre_c = Array2::zeros((n_pre, n_boot_control));
+            let mut y_boot_post_c = Array2::zeros((n_post, n_boot_control));
+            for (new_j, &old_j) in boot_control_idx.iter().enumerate() {
+                for t in 0..n_pre {
+                    y_boot_pre_c[[t, new_j]] = y_full[[t, old_j]];
+                }
+                for t in 0..n_post {
+                    y_boot_post_c[[t, new_j]] = y_full[[n_pre + t, old_j]];
+                }
+            }
+
+            // Compute treated means for resampled treated units
+            let mut y_boot_pre_t_mean = Array1::zeros(n_pre);
+            let mut y_boot_post_t_mean = Array1::zeros(n_post);
+            for &old_j in &boot_treated_idx {
+                for t in 0..n_pre {
+                    y_boot_pre_t_mean[t] += y_full[[t, old_j]];
+                }
+                for t in 0..n_post {
+                    y_boot_post_t_mean[t] += y_full[[n_pre + t, old_j]];
+                }
+            }
+            y_boot_pre_t_mean /= n_boot_treated as f64;
+            y_boot_post_t_mean /= n_boot_treated as f64;
+
+            // Compute ATT with FIXED time_weights and renormalized omega
+            let tau = sdid_estimator_internal(
+                &y_boot_pre_c,
+                &y_boot_post_c,
+                &y_boot_pre_t_mean,
+                &y_boot_post_t_mean,
+                &boot_omega,
+                &lambda,
+            );
+
+            if tau.is_finite() {
+                Some(tau)
+            } else {
+                None
+            }
+        })
+        .collect();
+
+    let n_successful = bootstrap_estimates.len();
+    let n_failed = n_bootstrap - n_successful;
+
+    // Compute SE: std(estimates, ddof=1) — NO sqrt((r-1)/r) for bootstrap
+    let se = if n_successful < 2 {
+        0.0
+    } else {
+        let n = n_successful as f64;
+        let mean = bootstrap_estimates.iter().sum::<f64>() / n;
+        let variance = bootstrap_estimates
+            .iter()
+            .map(|x| (x - mean).powi(2))
+            .sum::<f64>()
+            / (n - 1.0);
+        variance.sqrt()
+    };
+
+    let estimates_arr = Array1::from_vec(bootstrap_estimates);
+    Ok((se, estimates_arr.to_pyarray_bound(py), n_failed))
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use ndarray::array;
+
+    #[test]
+    fn test_fisher_yates_permutation_length() {
+        use rand::SeedableRng;
+        use rand_xoshiro::Xoshiro256PlusPlus;
+        let mut rng = Xoshiro256PlusPlus::seed_from_u64(42);
+        let perm = fisher_yates_permutation(&mut rng, 10);
+        assert_eq!(perm.len(), 10);
+        // All elements should be present
+        let mut sorted = perm.clone();
+        sorted.sort();
+        assert_eq!(sorted, (0..10).collect::<Vec<usize>>());
+    }
+
+    #[test]
+    fn test_fisher_yates_permutation_different_seeds() {
+        use rand::SeedableRng;
+        use rand_xoshiro::Xoshiro256PlusPlus;
+        let mut rng1 = Xoshiro256PlusPlus::seed_from_u64(42);
+        let mut rng2 = Xoshiro256PlusPlus::seed_from_u64(43);
+        let perm1 = fisher_yates_permutation(&mut rng1, 20);
+        let perm2 = fisher_yates_permutation(&mut rng2, 20);
+        assert_ne!(perm1, perm2);
+    }
+
+    #[test]
+    fn test_extract_submatrix_cols() {
+        let m = array![[1.0, 2.0, 3.0, 4.0], [5.0, 6.0, 
7.0, 8.0]];
        let sub = extract_submatrix_cols(&m, &[0, 2]);
        assert_eq!(sub.nrows(), 2);
        assert_eq!(sub.ncols(), 2);
        assert!((sub[[0, 0]] - 1.0).abs() < 1e-10);
        assert!((sub[[0, 1]] - 3.0).abs() < 1e-10);
        assert!((sub[[1, 0]] - 5.0).abs() < 1e-10);
        assert!((sub[[1, 1]] - 7.0).abs() < 1e-10);
    }

    #[test]
    fn test_column_means() {
        let m = array![[1.0, 2.0, 3.0, 4.0], [5.0, 6.0, 7.0, 8.0]];
        let means = column_means(&m, &[1, 3]);
        // Mean of columns 1 and 3:
        // Row 0: (2+4)/2 = 3
        // Row 1: (6+8)/2 = 7
        assert!((means[0] - 3.0).abs() < 1e-10);
        assert!((means[1] - 7.0).abs() < 1e-10);
    }

    #[test]
    fn test_sdid_estimator_internal_zero_weights() {
        // When all time weights are on last pre-period and unit weights are uniform,
        // should reduce to a simpler DiD
        let y_pre_c = array![[1.0, 2.0], [3.0, 4.0]]; // (2 pre, 2 control)
        let y_post_c = array![[5.0, 6.0]]; // (1 post, 2 control)
        let y_pre_t = array![2.0, 4.0]; // (2 pre,) means
        let y_post_t = array![10.0]; // (1 post,) means

        let omega = array![0.5, 0.5]; // uniform
        let lambda = array![0.0, 1.0]; // all weight on last pre-period

        let tau = sdid_estimator_internal(
            &y_pre_c, &y_post_c, &y_pre_t, &y_post_t, &omega, &lambda,
        );

        // Manual computation:
        // weighted_pre_control = [0, 1] @ [[1,2],[3,4]] = [3, 4]
        // weighted_pre_treated = [0, 1] @ [2, 4] = 4
        // mean_post_control = [5, 6]
        // mean_post_treated = 10
        // did_treated = 10 - 4 = 6
        // did_control = [0.5, 0.5] @ ([5,6] - [3,4]) = [0.5, 0.5] @ [2, 2] = 2
        // tau = 6 - 2 = 4
        assert!((tau - 4.0).abs() < 1e-10, "Expected 4.0, got {}", tau);
    }
}
diff --git a/rust/src/weights.rs b/rust/src/weights.rs
index 40e3ae07..9b5cfb5d 100644
--- a/rust/src/weights.rs
+++ b/rust/src/weights.rs
@@ -1,10 +1,12 @@
-//! Synthetic control weight computation via projected gradient descent.
+//! Synthetic control weight computation.
 //!
 //! This module provides optimized implementations of:
-//! - Synthetic control weight optimization
+//! - Legacy synthetic control weight optimization (projected gradient descent)
+//! - Frank-Wolfe synthetic control weights (matching R's synthdid)
 //! - Simplex projection
+//! - SDID unit and time weight computation
 
-use ndarray::{Array1, ArrayView1, ArrayView2};
+use ndarray::{s, Array1, Array2, ArrayView1, ArrayView2, Axis};
 use numpy::{PyArray1, PyReadonlyArray1, PyReadonlyArray2, ToPyArray};
 use pyo3::prelude::*;
 
@@ -17,6 +19,10 @@ const DEFAULT_TOL: f64 = 1e-8;
 /// Default step size for gradient descent.
 const DEFAULT_STEP_SIZE: f64 = 0.1;
 
+// =========================================================================
+// Legacy synthetic control weights (projected gradient descent)
+// =========================================================================
+
 /// Compute synthetic control weights via projected gradient descent.
 ///
 /// Solves: min_w ||Y_treated - Y_control @ w||² + lambda * ||w||²
@@ -109,6 +115,10 @@ fn compute_synthetic_weights_internal(
     Ok(weights)
 }
 
+// =========================================================================
+// Simplex projection
+// =========================================================================
+
 /// Project a vector onto the probability simplex.
 ///
 /// Implements the O(n log n) algorithm from:
@@ -161,6 +171,396 @@ fn project_simplex_internal(v: &ArrayView1<f64>) -> Array1<f64> {
     v.mapv(|x| (x - theta).max(0.0))
 }
 
+// =========================================================================
+// Frank-Wolfe solver (matching R's synthdid)
+// =========================================================================
+
+/// Normalize vector to sum to 1. Fallback to uniform if sum is zero.
+/// Matches R's synthdid sum_normalize().
+pub(crate) fn sum_normalize_internal(v: &Array1<f64>) -> Array1<f64> {
+    let s: f64 = v.sum();
+    if s > 0.0 {
+        v / s
+    } else {
+        Array1::from_elem(v.len(), 1.0 / v.len() as f64)
+    }
+}
+
+/// Sparsify weight vector by zeroing out small entries.
+/// Matches R's synthdid sparsify_function:
+/// v[v <= max(v)/4] = 0; v = v / sum(v)
+fn sparsify_internal(v: &Array1<f64>) -> Array1<f64> {
+    let n = v.len();
+    let max_v = v.iter().cloned().fold(f64::NEG_INFINITY, f64::max);
+    if max_v <= 0.0 {
+        return Array1::from_elem(n, 1.0 / n as f64);
+    }
+    let threshold = max_v / 4.0;
+    let mut result = v.clone();
+    result.mapv_inplace(|x| if x <= threshold { 0.0 } else { x });
+    sum_normalize_internal(&result)
+}
+
+/// Single Frank-Wolfe step on the simplex.
+/// Matches R's fw.step() in synthdid's sc.weight.fw().
+fn fw_step_internal(
+    a: &ArrayView2<f64>,
+    x: &Array1<f64>,
+    b: &ArrayView1<f64>,
+    eta: f64,
+) -> Array1<f64> {
+    let ax = a.dot(x);
+    let diff = &ax - b;
+    let half_grad = a.t().dot(&diff) + eta * x;
+
+    // Find vertex with smallest gradient component
+    let i = half_grad
+        .iter()
+        .enumerate()
+        .min_by(|(_, a), (_, b)| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal))
+        .map(|(idx, _)| idx)
+        .unwrap_or(0);
+
+    // Direction: d_x = e_i - x
+    let mut d_x = -x.clone();
+    d_x[i] += 1.0;
+
+    // Check if direction is essentially zero
+    let d_x_norm_sq: f64 = d_x.iter().map(|&v| v * v).sum();
+    if d_x_norm_sq < 1e-24 {
+        return x.clone();
+    }
+
+    // Compute step size via exact line search
+    let d_err = a.column(i).to_owned() - &ax;
+    let denom = d_err.dot(&d_err) + eta * d_x.dot(&d_x);
+    if denom <= 0.0 {
+        return x.clone();
+    }
+    let step = -(half_grad.dot(&d_x)) / denom;
+    let step = step.max(0.0).min(1.0);
+
+    x + &(step * &d_x)
+}
+
+/// Compute synthetic control weights via Frank-Wolfe optimization.
+///
+/// Matches R's sc.weight.fw() from the synthdid package. Solves:
+///     min_{lambda on simplex} zeta^2 * ||lambda||^2
+///                             + (1/N) * ||A_centered @ lambda - b_centered||^2
+///
+/// # Arguments
+/// * `y` - Matrix of shape (N, T0+1). Last column is the target.
+/// * `zeta` - Regularization strength.
+/// * `intercept` - If true, column-center Y before optimization.
+/// * `init_weights` - Initial weights. If None, starts with uniform.
+/// * `min_decrease` - Convergence criterion: stop when objective decrease < min_decrease^2.
+/// * `max_iter` - Maximum number of iterations.
+///
+/// # Returns
+/// Weights of shape (T0,) on the simplex.
+fn sc_weight_fw_internal(
+    y: &ArrayView2<f64>,
+    zeta: f64,
+    intercept: bool,
+    init_weights: Option<&Array1<f64>>,
+    min_decrease: f64,
+    max_iter: usize,
+) -> Array1<f64> {
+    let t0 = y.ncols() - 1;
+    let n = y.nrows();
+
+    if t0 == 0 {
+        return Array1::ones(1);
+    }
+
+    // Column-center if using intercept — owned Array2 for the centered case
+    let y_owned: Array2<f64> = if intercept {
+        let col_means = y.mean_axis(Axis(0)).unwrap();
+        y - &col_means
+    } else {
+        y.to_owned()
+    };
+
+    let a = y_owned.slice(s![.., ..t0]);
+    let b = y_owned.column(t0);
+    let eta = n as f64 * zeta * zeta;
+
+    let mut lam = match init_weights {
+        Some(w) => w.clone(),
+        None => Array1::from_elem(t0, 1.0 / t0 as f64),
+    };
+
+    let min_decrease_sq = min_decrease * min_decrease;
+    let mut prev_val = f64::INFINITY;
+
+    for t in 0..max_iter {
+        lam = fw_step_internal(&a, &lam, &b, eta);
+
+        // Compute objective: zeta^2 * ||lam||^2 + (1/N) * ||Y @ [lam, -1]||^2
+        let mut lam_ext = Array1::zeros(t0 + 1);
+        lam_ext.slice_mut(s![..t0]).assign(&lam);
+        lam_ext[t0] = -1.0;
+        let err = y_owned.dot(&lam_ext);
+        let val = zeta * zeta * lam.dot(&lam) + err.dot(&err) / n as f64;
+
+        if t >= 1 && prev_val - val < min_decrease_sq {
+            break;
+        }
+        prev_val = val;
+    }
+
+    lam
+}
+
+/// Compute noise level from first-differences of control outcomes.
+///
+/// Matches R's sd(apply(Y[1:N0, 1:T0], 1, diff)).
+///
+/// # Arguments
+/// * `y_pre_control` - Control unit pre-treatment outcomes (n_pre, n_control)
+///
+/// # Returns
+/// Noise level (standard deviation of first-differences with ddof=1)
+#[pyfunction]
+pub fn compute_noise_level<'py>(
+    _py: Python<'py>,
+    y_pre_control: PyReadonlyArray2<'py, f64>,
+) -> PyResult<f64> {
+    let y = y_pre_control.as_array();
+    Ok(compute_noise_level_internal(&y))
+}
+
+fn compute_noise_level_internal(y_pre_control: &ArrayView2<f64>) -> f64 {
+    let n_pre = y_pre_control.nrows();
+    if n_pre < 2 {
+        return 0.0;
+    }
+
+    // First differences along time axis: (T_pre-1, N_co)
+    let n_diff = n_pre - 1;
+    let n_control = y_pre_control.ncols();
+    let total = n_diff * n_control;
+    if total == 0 {
+        return 0.0;
+    }
+
+    // Compute mean of first diffs
+    let mut sum = 0.0;
+    for t in 0..n_diff {
+        for j in 0..n_control {
+            sum += y_pre_control[[t + 1, j]] - y_pre_control[[t, j]];
+        }
+    }
+    let mean = sum / total as f64;
+
+    // Compute variance with ddof=1
+    let mut ss = 0.0;
+    for t in 0..n_diff {
+        for j in 0..n_control {
+            let d = (y_pre_control[[t + 1, j]] - y_pre_control[[t, j]]) - mean;
+            ss += d * d;
+        }
+    }
+
+    if total <= 1 {
+        return 0.0;
+    }
+    (ss / (total - 1) as f64).sqrt()
+}
+
+/// Expose the generic Frank-Wolfe solver to Python.
+///
+/// # Arguments
+/// * `y` - Matrix (N, T0+1). Last column is target.
+/// * `zeta` - Regularization strength.
+/// * `intercept` - Column-center if true.
+/// * `init_weights` - Optional initial weights.
+/// * `min_decrease` - Convergence threshold.
+/// * `max_iter` - Maximum iterations.
+#[pyfunction]
+#[pyo3(signature = (y, zeta, intercept=true, init_weights=None, min_decrease=1e-5, max_iter=10000))]
+pub fn sc_weight_fw<'py>(
+    py: Python<'py>,
+    y: PyReadonlyArray2<'py, f64>,
+    zeta: f64,
+    intercept: bool,
+    init_weights: Option<PyReadonlyArray1<'py, f64>>,
+    min_decrease: f64,
+    max_iter: usize,
+) -> PyResult<Bound<'py, PyArray1<f64>>> {
+    let y_arr = y.as_array();
+    let init = init_weights.map(|w| {
+        let v = w.as_array();
+        v.to_owned()
+    });
+    let result = sc_weight_fw_internal(
+        &y_arr,
+        zeta,
+        intercept,
+        init.as_ref(),
+        min_decrease,
+        max_iter,
+    );
+    Ok(result.to_pyarray_bound(py))
+}
+
+/// Compute SDID time weights via Frank-Wolfe optimization.
+///
+/// Matches R's synthdid: sc.weight.fw(Yc[1:N0, ], zeta=zeta.lambda, intercept=TRUE)
+///
+/// # Arguments
+/// * `y_pre_control` - Control outcomes in pre-treatment periods (n_pre, n_control)
+/// * `y_post_control` - Control outcomes in post-treatment periods (n_post, n_control)
+/// * `zeta_lambda` - Regularization parameter for time weights
+/// * `intercept` - Column-center if true
+/// * `min_decrease` - Convergence threshold
+/// * `max_iter` - Maximum iterations
+#[pyfunction]
+#[pyo3(signature = (y_pre_control, y_post_control, zeta_lambda, intercept=true, min_decrease=1e-5, max_iter_pre_sparsify=100, max_iter=10000))]
+pub fn compute_time_weights<'py>(
+    py: Python<'py>,
+    y_pre_control: PyReadonlyArray2<'py, f64>,
+    y_post_control: PyReadonlyArray2<'py, f64>,
+    zeta_lambda: f64,
+    intercept: bool,
+    min_decrease: f64,
+    max_iter_pre_sparsify: usize,
+    max_iter: usize,
+) -> PyResult<Bound<'py, PyArray1<f64>>> {
+    let y_pre = y_pre_control.as_array();
+    let y_post = y_post_control.as_array();
+
+    let result = compute_time_weights_internal(&y_pre, &y_post, zeta_lambda, intercept, min_decrease, max_iter_pre_sparsify, max_iter);
+    Ok(result.to_pyarray_bound(py))
+}
+
+pub(crate) fn compute_time_weights_internal(
+    y_pre_control: &ArrayView2<f64>,
+    y_post_control: &ArrayView2<f64>,
+    zeta_lambda: f64,
+    intercept: bool,
+    min_decrease: f64,
+    max_iter_pre_sparsify: usize,
+    max_iter: usize,
+) -> Array1<f64> {
+    let n_pre = y_pre_control.nrows();
+
+    if n_pre <= 1 {
+        return Array1::ones(n_pre);
+    }
+
+    let n_control = y_pre_control.ncols();
+
+    // Build collapsed form: (N_co, T_pre + 1), last col = per-control post mean
+    let mut y_time = Array2::zeros((n_control, n_pre + 1));
+
+    // Fill pre-period columns (transpose of y_pre_control)
+    for j in 0..n_control {
+        for t in 0..n_pre {
+            y_time[[j, t]] = y_pre_control[[t, j]];
+        }
+    }
+
+    // Fill last column with per-control post means
+    let n_post = y_post_control.nrows();
+    for j in 0..n_control {
+        let mut sum = 0.0;
+        for t in 0..n_post {
+            sum += y_post_control[[t, j]];
+        }
+        y_time[[j, n_pre]] = if n_post > 0 { sum / n_post as f64 } else { 0.0 };
+    }
+
+    // Two-pass sparsification (matching R's default sparsify=sparsify_function)
+    // First pass: limited iterations
+    let lam = sc_weight_fw_internal(&y_time.view(), zeta_lambda, intercept, None, min_decrease, max_iter_pre_sparsify);
+
+    // Sparsify
+    let lam_sparse = sparsify_internal(&lam);
+
+    // Second pass: from sparsified initialization
+    sc_weight_fw_internal(&y_time.view(), zeta_lambda, intercept, Some(&lam_sparse), min_decrease, max_iter)
+}
+
+/// Compute SDID unit weights via Frank-Wolfe with two-pass sparsification.
+///
+/// Matches R's synthdid: sc.weight.fw(t(Yc[, 1:T0]), zeta=zeta.omega, intercept=TRUE)
+/// followed by sparsify_function + second sc.weight.fw pass.
+///
+/// # Arguments
+/// * `y_pre_control` - Control outcomes in pre-treatment periods (n_pre, n_control)
+/// * `y_pre_treated_mean` - Mean treated outcomes in pre-treatment periods (n_pre,)
+/// * `zeta_omega` - Regularization parameter for unit weights
+/// * `intercept` - Column-center if true
+/// * `min_decrease` - Convergence threshold
+/// * `max_iter_pre_sparsify` - Iterations for first pass (before sparsification)
+/// * `max_iter` - Iterations for second pass (after sparsification)
+#[pyfunction]
+#[pyo3(signature = (y_pre_control, y_pre_treated_mean, zeta_omega, intercept=true, min_decrease=1e-5, max_iter_pre_sparsify=100, max_iter=10000))]
+pub fn compute_sdid_unit_weights<'py>(
+    py: Python<'py>,
+    y_pre_control: PyReadonlyArray2<'py, f64>,
+    y_pre_treated_mean: PyReadonlyArray1<'py, f64>,
+    zeta_omega: f64,
+    intercept: bool,
+    min_decrease: f64,
+    max_iter_pre_sparsify: usize,
+    max_iter: usize,
+) -> PyResult<Bound<'py, PyArray1<f64>>> {
+    let y_pre = y_pre_control.as_array();
+    let y_tr_mean = y_pre_treated_mean.as_array();
+
+    let result = compute_sdid_unit_weights_internal(
+        &y_pre, &y_tr_mean, zeta_omega, intercept, min_decrease,
+        max_iter_pre_sparsify, max_iter,
+    );
+    Ok(result.to_pyarray_bound(py))
+}
+
+pub(crate) fn compute_sdid_unit_weights_internal(
+    y_pre_control: &ArrayView2<f64>,
+    y_pre_treated_mean: &ArrayView1<f64>,
+    zeta_omega: f64,
+    intercept: bool,
+    min_decrease: f64,
+    max_iter_pre_sparsify: usize,
+    max_iter: usize,
+) -> Array1<f64> {
+    let n_control = y_pre_control.ncols();
+
+    if n_control == 0 {
+        return Array1::zeros(0);
+    }
+    if n_control == 1 {
+        return Array1::ones(1);
+    }
+
+    let n_pre = y_pre_control.nrows();
+
+    // Build collapsed form: (T_pre, N_co + 1), last col = treated pre means
+    let mut y_unit = Array2::zeros((n_pre, n_control + 1));
+    for t in 0..n_pre {
+        for j in 0..n_control {
+            y_unit[[t, j]] = y_pre_control[[t, j]];
+        }
+        y_unit[[t, n_control]] = y_pre_treated_mean[t];
+    }
+
+    // First pass: limited iterations
+    let omega = sc_weight_fw_internal(
+        &y_unit.view(), zeta_omega, intercept, None, min_decrease, max_iter_pre_sparsify,
+    );
+
+    // Sparsify: zero out weights <= max/4, renormalize
+    let omega = sparsify_internal(&omega);
+
+    // Second pass: from sparsified initialization
+    sc_weight_fw_internal(
+        &y_unit.view(), zeta_omega, intercept, Some(&omega), min_decrease, max_iter,
+    )
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -217,4 +617,97 @@ mod tests {
             "Weights should be non-negative"
         );
     }
+
+    #[test]
+    fn test_sum_normalize() {
+        let v = array![2.0, 3.0, 5.0];
+        let result = sum_normalize_internal(&v);
+        assert!((result.sum() - 1.0).abs() < 1e-10);
+        assert!((result[0] - 0.2).abs() < 1e-10);
+        assert!((result[1] - 0.3).abs() < 1e-10);
+        assert!((result[2] - 0.5).abs() < 1e-10);
+    }
+
+    #[test]
+    fn test_sum_normalize_zero() {
+        let v = array![0.0, 0.0, 0.0];
+        let result = sum_normalize_internal(&v);
+        assert!((result.sum() - 1.0).abs() < 1e-10);
+        for &x in result.iter() {
+            assert!((x - 1.0 / 3.0).abs() < 1e-10);
+        }
+    }
+
+    #[test]
+    fn test_sparsify() {
+        let v = array![0.5, 0.3, 0.1, 0.05, 0.05];
+        let result = sparsify_internal(&v);
+        // max = 0.5, threshold = 0.125
+        // 0.1, 0.05, 0.05 should be zeroed out
+        assert!((result.sum() - 1.0).abs() < 1e-10);
+        assert!(result[2] == 0.0); // 0.1 <= 0.125
+        assert!(result[3] == 0.0);
+        assert!(result[4] == 0.0);
+        assert!(result[0] > 0.0);
+        assert!(result[1] > 0.0);
+    }
+
+    #[test]
+    fn test_noise_level_basic() {
+        // 3 pre-periods, 2 control units
+        // Unit 0: [1.0, 2.0, 3.0] -> diffs: [1.0, 1.0]
+        // Unit 1: [2.0, 4.0, 6.0] -> diffs: [2.0, 2.0]
+        // All diffs: [1.0, 1.0, 2.0, 2.0], mean=1.5, sd=sqrt(sum((d-1.5)^2)/3)
        let y = array![[1.0, 2.0], [2.0, 4.0], [3.0, 6.0]];
+        let nl = compute_noise_level_internal(&y.view());
+        // Diffs: [1.0, 2.0, 1.0, 2.0], mean=1.5
+        // Var = (0.25+0.25+0.25+0.25)/3 = 1.0/3
+        // sd = sqrt(1/3) ≈ 0.5774
+        assert!((nl - (1.0_f64 / 3.0).sqrt()).abs() < 1e-10);
+    }
+
+    #[test]
+    fn 
test_fw_weights_on_simplex() { + // Simple 3x3 problem: 2 pre-periods + 1 target column + let y = array![[1.0, 2.0, 1.5], [3.0, 4.0, 3.5], [5.0, 6.0, 5.5]]; + let result = sc_weight_fw_internal(&y.view(), 0.1, true, None, 1e-3, 100); + let sum: f64 = result.sum(); + assert!((sum - 1.0).abs() < 1e-6, "FW weights should sum to 1, got {}", sum); + assert!(result.iter().all(|&w| w >= -1e-6), "FW weights should be non-negative"); + } + + #[test] + fn test_time_weights_on_simplex() { + let y_pre = array![[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]; + let y_post = array![[10.0, 11.0, 12.0]]; + let result = compute_time_weights_internal(&y_pre.view(), &y_post.view(), 0.1, true, 1e-3, 100, 1000); + assert_eq!(result.len(), 3); + let sum: f64 = result.sum(); + assert!((sum - 1.0).abs() < 1e-6, "Time weights should sum to 1, got {}", sum); + assert!(result.iter().all(|&w| w >= -1e-6), "Time weights should be non-negative"); + } + + #[test] + fn test_unit_weights_on_simplex() { + let y_pre = array![[1.0, 2.0, 3.0], [4.0, 5.0, 6.0], [7.0, 8.0, 9.0]]; + let y_tr_mean = array![2.0, 5.0, 8.0]; + let result = compute_sdid_unit_weights_internal( + &y_pre.view(), &y_tr_mean.view(), 0.5, true, 1e-3, 100, 1000, + ); + assert_eq!(result.len(), 3); + let sum: f64 = result.sum(); + assert!((sum - 1.0).abs() < 1e-6, "Unit weights should sum to 1, got {}", sum); + assert!(result.iter().all(|&w| w >= -1e-6), "Unit weights should be non-negative"); + } + + #[test] + fn test_unit_weights_single_control() { + let y_pre = array![[1.0], [2.0], [3.0]]; + let y_tr_mean = array![1.5, 2.5, 3.5]; + let result = compute_sdid_unit_weights_internal( + &y_pre.view(), &y_tr_mean.view(), 0.5, true, 1e-3, 100, 1000, + ); + assert_eq!(result.len(), 1); + assert!((result[0] - 1.0).abs() < 1e-10); + } } diff --git a/tests/test_estimators.py b/tests/test_estimators.py index 3a055106..ab394a2b 100644 --- a/tests/test_estimators.py +++ b/tests/test_estimators.py @@ -2512,8 +2512,8 @@ def 
test_single_treated_unit(self, single_treated_unit_data, ci_params): def test_regularization_effect(self, sdid_panel_data): """Test that regularization affects weight dispersion.""" - sdid_no_reg = SyntheticDiD(lambda_reg=0.0, variance_method="placebo", seed=42) - sdid_high_reg = SyntheticDiD(lambda_reg=10.0, variance_method="placebo", seed=42) + sdid_no_reg = SyntheticDiD(zeta_omega=0.01, variance_method="placebo", seed=42) + sdid_high_reg = SyntheticDiD(zeta_omega=100.0, variance_method="placebo", seed=42) results_no_reg = sdid_no_reg.fit( sdid_panel_data, @@ -2721,21 +2721,42 @@ def test_is_significant_property(self, sdid_panel_data, ci_params): assert isinstance(results.is_significant, bool) def test_get_set_params(self): - """Test get_params and set_params.""" - sdid = SyntheticDiD(lambda_reg=1.0, zeta=0.5, alpha=0.10, variance_method="placebo") + """Test get_params and set_params with new parameter names.""" + sdid = SyntheticDiD(zeta_omega=1.0, zeta_lambda=0.5, alpha=0.10, variance_method="placebo") params = sdid.get_params() - assert params["lambda_reg"] == 1.0 - assert params["zeta"] == 0.5 + assert params["zeta_omega"] == 1.0 + assert params["zeta_lambda"] == 0.5 assert params["alpha"] == 0.10 assert params["variance_method"] == "placebo" - sdid.set_params(lambda_reg=2.0) - assert sdid.lambda_reg == 2.0 + sdid.set_params(zeta_omega=2.0) + assert sdid.zeta_omega == 2.0 sdid.set_params(variance_method="bootstrap") assert sdid.variance_method == "bootstrap" + def test_deprecated_params(self): + """Test that old parameter names emit DeprecationWarning.""" + import warnings as _warnings + + with _warnings.catch_warnings(record=True) as w: + _warnings.simplefilter("always") + sdid = SyntheticDiD(lambda_reg=1.0, zeta=0.5) + dep_warnings = [x for x in w if issubclass(x.category, DeprecationWarning)] + assert len(dep_warnings) == 2 + + # Deprecated params are ignored — auto-computed regularization is used + assert sdid.zeta_omega is None + assert sdid.zeta_lambda 
is None + + # set_params with deprecated names also warns + with _warnings.catch_warnings(record=True) as w: + _warnings.simplefilter("always") + sdid.set_params(lambda_reg=2.0) + dep_warnings = [x for x in w if issubclass(x.category, DeprecationWarning)] + assert len(dep_warnings) == 1 + def test_missing_unit_column(self, sdid_panel_data): """Test error when unit column is missing.""" sdid = SyntheticDiD() @@ -3035,7 +3056,7 @@ def test_more_pre_periods_than_control_units(self, ci_params): # Use regularization to help with underdetermined system n_boot = ci_params.bootstrap(30) - sdid = SyntheticDiD(lambda_reg=1.0, n_bootstrap=n_boot, seed=42) + sdid = SyntheticDiD(zeta_omega=1.0, n_bootstrap=n_boot, seed=42) results = sdid.fit( df, @@ -3097,22 +3118,23 @@ def test_compute_synthetic_weights(self): assert len(weights) == n_control def test_compute_time_weights(self): - """Test time weight computation.""" + """Test time weight computation with Frank-Wolfe solver.""" from diff_diff.utils import compute_time_weights np.random.seed(42) n_pre = 5 + n_post = 3 n_control = 10 - Y_control = np.random.randn(n_pre, n_control) - Y_treated = np.random.randn(n_pre) + Y_pre = np.random.randn(n_pre, n_control) + Y_post = np.random.randn(n_post, n_control) - weights = compute_time_weights(Y_control, Y_treated) + weights = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.01) # Weights should sum to 1 assert abs(np.sum(weights) - 1.0) < 1e-6 # Weights should be non-negative - assert np.all(weights >= 0) + assert np.all(weights >= -1e-10) # Should have correct length assert len(weights) == n_pre diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py new file mode 100644 index 00000000..812392c5 --- /dev/null +++ b/tests/test_methodology_sdid.py @@ -0,0 +1,605 @@ +""" +Methodology tests for Synthetic Difference-in-Differences (SDID). + +Tests verify the implementation matches Arkhangelsky et al. 
(2021) and +R's synthdid package behavior: Frank-Wolfe solver, collapsed form, +auto-regularization, sparsification, and correct bootstrap/placebo SE. +""" + +import warnings + +import numpy as np +import pytest + +from diff_diff.synthetic_did import SyntheticDiD +from diff_diff.utils import ( + _compute_noise_level, + _compute_regularization, + _fw_step, + _sc_weight_fw, + _sparsify, + _sum_normalize, + compute_sdid_estimator, + compute_sdid_unit_weights, + compute_time_weights, +) + + +# ============================================================================= +# Test Helpers +# ============================================================================= + + +def _make_panel(n_control=20, n_treated=3, n_pre=5, n_post=3, + att=5.0, seed=42): + """Create a simple panel dataset for testing.""" + rng = np.random.default_rng(seed) + data = [] + for unit in range(n_control + n_treated): + is_treated = unit >= n_control + unit_fe = rng.normal(0, 2) + for t in range(n_pre + n_post): + y = 10.0 + unit_fe + t * 0.3 + rng.normal(0, 0.5) + if is_treated and t >= n_pre: + y += att + data.append({ + "unit": unit, + "period": t, + "treated": int(is_treated), + "outcome": y, + }) + import pandas as pd + return pd.DataFrame(data) + + +# ============================================================================= +# Phase A: Noise Level and Regularization +# ============================================================================= + + +class TestNoiseLevel: + """Verify _compute_noise_level matches hand-computed first-diff sd.""" + + def test_known_values(self): + """Test with a simple matrix where first-diffs are known.""" + # 3 time periods, 2 control units + # Unit 0: [1, 3, 6] -> diffs: [2, 3] + # Unit 1: [2, 2, 5] -> diffs: [0, 3] + # All diffs: [2, 3, 0, 3], sd(ddof=1) = std([2,3,0,3], ddof=1) + Y = np.array([[1.0, 2.0], + [3.0, 2.0], + [6.0, 5.0]]) + expected = np.std([2.0, 3.0, 0.0, 3.0], ddof=1) + result = _compute_noise_level(Y) + assert abs(result - expected) < 
1e-10 + + def test_single_period(self): + """Single period -> no diffs possible -> noise level = 0.""" + Y = np.array([[1.0, 2.0, 3.0]]) + assert _compute_noise_level(Y) == 0.0 + + def test_two_periods(self): + """Two periods -> one diff per unit.""" + Y = np.array([[1.0, 4.0], + [3.0, 7.0]]) + # Diffs: [2.0, 3.0], sd(ddof=1) + expected = np.std([2.0, 3.0], ddof=1) + assert abs(_compute_noise_level(Y) - expected) < 1e-10 + + +class TestRegularization: + """Verify _compute_regularization formula with known inputs.""" + + def test_formula(self): + """Check zeta_omega = (N1*T1)^0.25 * sigma, zeta_lambda = 1e-6 * sigma.""" + # Use a simple Y_pre_control where sigma is easy to compute + Y = np.array([[1.0, 2.0], + [3.0, 4.0], + [6.0, 7.0]]) + sigma = _compute_noise_level(Y) + n_treated, n_post = 2, 3 + + zeta_omega, zeta_lambda = _compute_regularization(Y, n_treated, n_post) + + expected_omega = (n_treated * n_post) ** 0.25 * sigma + expected_lambda = 1e-6 * sigma + + assert abs(zeta_omega - expected_omega) < 1e-10 + assert abs(zeta_lambda - expected_lambda) < 1e-15 + + def test_zero_noise(self): + """Constant outcomes -> zero noise -> zero regularization.""" + Y = np.array([[5.0, 5.0], + [5.0, 5.0], + [5.0, 5.0]]) + zo, zl = _compute_regularization(Y, 2, 3) + assert zo == 0.0 + assert zl == 0.0 + + +# ============================================================================= +# Phase B: Frank-Wolfe Solver +# ============================================================================= + + +class TestFrankWolfe: + """Verify Frank-Wolfe step and solver behavior.""" + + def test_fw_step_descent(self): + """A single FW step should not increase the half-gradient objective. + + The FW step minimizes the linearized objective at the current point. + After the step with exact line search, the true objective should + not increase when measured correctly. 
+ """ + rng = np.random.default_rng(42) + N, T0 = 10, 5 + A = rng.standard_normal((N, T0)) + b = rng.standard_normal(N) + eta = N * 0.1 ** 2 # eta = N * zeta^2 matching R's formulation + + x = np.ones(T0) / T0 + + # Run a few steps to get away from the initial uniform point + # (first step from uniform can have numerical issues) + for _ in range(5): + x = _fw_step(A, x, b, eta) + + def objective(lam): + err = A @ lam - b + return (eta / N) * np.sum(lam**2) + np.sum(err**2) / N + + obj_before = objective(x) + x_new = _fw_step(A, x, b, eta) + obj_after = objective(x_new) + + assert obj_after <= obj_before + 1e-8 + + def test_fw_step_on_simplex(self): + """FW step should return a vector on the simplex.""" + rng = np.random.default_rng(42) + A = rng.standard_normal((8, 4)) + b = rng.standard_normal(8) + x = np.array([0.25, 0.25, 0.25, 0.25]) + + x_new = _fw_step(A, x, b, eta=1.0) + assert np.all(x_new >= -1e-10) + assert abs(np.sum(x_new) - 1.0) < 1e-10 + + def test_sc_weight_fw_converges(self): + """Full FW solver should converge on a known QP.""" + rng = np.random.default_rng(42) + N, T0 = 15, 6 + Y = rng.standard_normal((N, T0 + 1)) # last col is target + + lam = _sc_weight_fw(Y, zeta=0.1, max_iter=1000) + assert np.all(lam >= -1e-10) + assert abs(np.sum(lam) - 1.0) < 1e-6 + + def test_sc_weight_fw_max_iter_zero(self): + """max_iter=0 should return initial uniform weights.""" + Y = np.random.randn(5, 4) # (N, T0+1) with T0=3 + lam = _sc_weight_fw(Y, zeta=0.1, max_iter=0) + expected = np.ones(3) / 3 + np.testing.assert_allclose(lam, expected, atol=1e-10) + + def test_sc_weight_fw_max_iter_one(self): + """max_iter=1 should return weights after one step (still on simplex).""" + rng = np.random.default_rng(99) + Y = rng.standard_normal((8, 5)) + lam = _sc_weight_fw(Y, zeta=0.1, max_iter=1) + assert np.all(lam >= -1e-10) + assert abs(np.sum(lam) - 1.0) < 1e-10 + + def test_intercept_centering(self): + """With intercept=True, column-centering should occur.""" + rng = 
np.random.default_rng(42) + Y = rng.standard_normal((10, 5)) + 100 # large offset + lam_intercept = _sc_weight_fw(Y, zeta=0.1, intercept=True) + lam_no_intercept = _sc_weight_fw(Y, zeta=0.1, intercept=False) + # Both should be on simplex but may differ + assert abs(np.sum(lam_intercept) - 1.0) < 1e-6 + assert abs(np.sum(lam_no_intercept) - 1.0) < 1e-6 + # They should be different because centering matters + assert not np.allclose(lam_intercept, lam_no_intercept, atol=1e-3) + + +class TestSparsify: + """Verify sparsification behavior.""" + + def test_basic(self): + """Weights below max/4 should be zeroed.""" + v = np.array([0.8, 0.1, 0.05, 0.05]) + result = _sparsify(v) + assert result[0] > 0 + # 0.1 < 0.8/4 = 0.2, so should be zeroed + assert result[1] == 0.0 + assert result[2] == 0.0 + assert result[3] == 0.0 + assert abs(np.sum(result) - 1.0) < 1e-10 + + def test_all_zero(self): + """All-zero input should return uniform weights.""" + v = np.zeros(5) + result = _sparsify(v) + np.testing.assert_allclose(result, np.ones(5) / 5) + + def test_single_nonzero(self): + """Single nonzero element -> that element becomes 1.0.""" + v = np.array([0.0, 0.0, 0.5, 0.0]) + result = _sparsify(v) + assert result[2] == 1.0 + assert np.sum(result) == 1.0 + + def test_equal_weights(self): + """Equal weights: all equal max, so max/4 threshold keeps them all.""" + v = np.array([0.25, 0.25, 0.25, 0.25]) + result = _sparsify(v) + # 0.25 > 0.25/4 = 0.0625, so all kept + np.testing.assert_allclose(result, v, atol=1e-10) + + +class TestSumNormalize: + """Verify _sum_normalize helper.""" + + def test_basic(self): + v = np.array([2.0, 3.0, 5.0]) + result = _sum_normalize(v) + np.testing.assert_allclose(result, [0.2, 0.3, 0.5]) + + def test_zero_sum(self): + """Zero-sum vector -> uniform weights.""" + v = np.array([0.0, 0.0, 0.0]) + result = _sum_normalize(v) + np.testing.assert_allclose(result, [1.0/3, 1.0/3, 1.0/3]) + + +# 
============================================================================= +# Phase C/D: Unit and Time Weights +# ============================================================================= + + +class TestUnitWeights: + """Verify compute_sdid_unit_weights behavior.""" + + def test_simplex_constraint(self): + """Weights should be on the simplex (sum to 1, non-negative).""" + rng = np.random.default_rng(42) + Y_pre = rng.standard_normal((8, 15)) + Y_pre_treated_mean = rng.standard_normal(8) + + omega = compute_sdid_unit_weights(Y_pre, Y_pre_treated_mean, zeta_omega=1.0) + + assert np.all(omega >= -1e-10) + assert abs(np.sum(omega) - 1.0) < 1e-6 + + def test_single_control(self): + """Single control unit -> weight = [1.0].""" + Y_pre = np.array([[1.0], [2.0], [3.0]]) + Y_pre_treated_mean = np.array([1.5, 2.5, 3.5]) + + omega = compute_sdid_unit_weights(Y_pre, Y_pre_treated_mean, zeta_omega=1.0) + + assert len(omega) == 1 + assert abs(omega[0] - 1.0) < 1e-10 + + def test_empty_control(self): + """No control units -> empty array.""" + Y_pre = np.zeros((5, 0)) + Y_pre_treated_mean = np.array([1.0, 2.0, 3.0, 4.0, 5.0]) + + omega = compute_sdid_unit_weights(Y_pre, Y_pre_treated_mean, zeta_omega=1.0) + + assert len(omega) == 0 + + def test_sparsification_occurs(self): + """With enough controls, some weights should be zeroed by sparsification.""" + rng = np.random.default_rng(42) + # Many controls with varied patterns — expect some to get zeroed + Y_pre = rng.standard_normal((10, 50)) + Y_pre_treated_mean = rng.standard_normal(10) + + omega = compute_sdid_unit_weights(Y_pre, Y_pre_treated_mean, zeta_omega=0.5) + + # At least some weights should be exactly zero after sparsification + assert np.sum(omega == 0) > 0 + + +class TestTimeWeights: + """Verify compute_time_weights behavior.""" + + def test_simplex_constraint(self): + """Weights should be on the simplex.""" + rng = np.random.default_rng(42) + Y_pre = rng.standard_normal((8, 15)) + Y_post = rng.standard_normal((3, 
15)) + + lam = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.01) + + assert np.all(lam >= -1e-10) + assert abs(np.sum(lam) - 1.0) < 1e-6 + + def test_single_pre_period(self): + """Single pre-period -> weight = [1.0].""" + Y_pre = np.array([[1.0, 2.0, 3.0]]) + Y_post = np.array([[4.0, 5.0, 6.0]]) + + lam = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.01) + + assert len(lam) == 1 + assert abs(lam[0] - 1.0) < 1e-10 + + def test_collapsed_form_correctness(self): + """Verify the collapsed form matrix is built correctly. + + The time weight optimization solves on (N_co, T_pre+1) where the + last column is the per-control post-period mean. + """ + rng = np.random.default_rng(42) + Y_pre = rng.standard_normal((4, 3)) # 4 pre-periods, 3 controls + Y_post = rng.standard_normal((2, 3)) # 2 post-periods, 3 controls + + lam = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.01) + + # Should have 4 weights (one per pre-period) + assert len(lam) == 4 + assert abs(np.sum(lam) - 1.0) < 1e-6 + + +# ============================================================================= +# Full Pipeline +# ============================================================================= + + +class TestATTFullPipeline: + """Test full SDID estimation pipeline.""" + + def test_estimation_produces_reasonable_att(self, ci_params): + """Full estimation on canonical data should produce reasonable ATT.""" + df = _make_panel(n_control=20, n_treated=3, n_pre=6, n_post=3, + att=5.0, seed=42) + n_boot = ci_params.bootstrap(50) + sdid = SyntheticDiD(n_bootstrap=n_boot, seed=42, variance_method="placebo") + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=list(range(6, 9)), + ) + + # ATT should be positive and reasonably close to true value + assert results.att > 0 + assert abs(results.att - 5.0) < 3.0 + + def test_results_have_regularization_info(self): + """Results should include noise_level, zeta_omega, zeta_lambda.""" + df = 
_make_panel(seed=42) + sdid = SyntheticDiD(variance_method="placebo", seed=42) + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=list(range(5, 8)), + ) + + assert results.noise_level is not None + assert results.noise_level >= 0 + assert results.zeta_omega is not None + assert results.zeta_omega >= 0 + assert results.zeta_lambda is not None + assert results.zeta_lambda >= 0 + + def test_user_override_regularization(self): + """User-specified zeta_omega/zeta_lambda should be used instead of auto.""" + df = _make_panel(seed=42) + sdid = SyntheticDiD( + zeta_omega=99.0, zeta_lambda=0.5, + variance_method="placebo", seed=42 + ) + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=list(range(5, 8)), + ) + + assert results.zeta_omega == 99.0 + assert results.zeta_lambda == 0.5 + + +# ============================================================================= +# Placebo SE +# ============================================================================= + + +class TestPlaceboSE: + """Verify placebo variance formula.""" + + def test_placebo_se_formula(self): + """SE should be sqrt((r-1)/r) * sd(estimates, ddof=1).""" + df = _make_panel(n_control=15, n_treated=2, seed=42) + sdid = SyntheticDiD( + variance_method="placebo", n_bootstrap=100, seed=42 + ) + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=list(range(5, 8)), + ) + + assert results.se > 0 + assert results.variance_method == "placebo" + + # Verify the formula: se = sqrt((r-1)/r) * sd(placebo_estimates) + if results.placebo_effects is not None: + r = len(results.placebo_effects) + expected_se = np.sqrt((r - 1) / r) * np.std(results.placebo_effects, ddof=1) + assert abs(results.se - expected_se) < 1e-10 + + +# ============================================================================= +# Bootstrap SE +# 
============================================================================= + + +class TestBootstrapSE: + """Verify bootstrap SE with fixed weights.""" + + def test_bootstrap_se_positive(self, ci_params): + """Bootstrap SE should be positive.""" + df = _make_panel(n_control=20, n_treated=3, seed=42) + n_boot = ci_params.bootstrap(50) + sdid = SyntheticDiD( + variance_method="bootstrap", n_bootstrap=n_boot, seed=42 + ) + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=list(range(5, 8)), + ) + + assert results.se > 0 + assert results.variance_method == "bootstrap" + + +# ============================================================================= +# Edge Cases +# ============================================================================= + + +class TestEdgeCases: + """Edge case handling.""" + + def test_single_treated_unit(self, ci_params): + """Estimation should work with a single treated unit.""" + df = _make_panel(n_control=10, n_treated=1, n_pre=5, n_post=2, + att=3.0, seed=42) + n_boot = ci_params.bootstrap(30) + sdid = SyntheticDiD(n_bootstrap=n_boot, seed=42) + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=[5, 6], + ) + assert np.isfinite(results.att) + + def test_insufficient_controls_for_placebo(self): + """Placebo with n_control <= n_treated should warn and return SE=0.""" + df = _make_panel(n_control=2, n_treated=3, n_pre=5, n_post=2, seed=42) + sdid = SyntheticDiD(variance_method="placebo", seed=42) + + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=[5, 6], + ) + user_warnings = [x for x in w if issubclass(x.category, UserWarning)] + # Should warn about insufficient controls for placebo + assert len(user_warnings) > 0 + + assert results.se == 0.0 + + def 
test_se_zero_propagation(self): + """When SE=0, t_stat and p_value should be NaN, CI should be NaN.""" + df = _make_panel(n_control=2, n_treated=3, n_pre=5, n_post=2, seed=42) + sdid = SyntheticDiD(variance_method="placebo", seed=42) + + with warnings.catch_warnings(record=True): + warnings.simplefilter("always") + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=[5, 6], + ) + + if results.se == 0.0: + assert np.isnan(results.t_stat) + assert np.isnan(results.p_value) + assert np.isnan(results.conf_int[0]) + assert np.isnan(results.conf_int[1]) + + +# ============================================================================= +# get_params / set_params +# ============================================================================= + + +class TestGetSetParams: + """Verify parameter accessors.""" + + def test_get_params_includes_new_names(self): + """get_params should include zeta_omega/zeta_lambda.""" + sdid = SyntheticDiD(zeta_omega=1.0, zeta_lambda=0.5) + params = sdid.get_params() + assert "zeta_omega" in params + assert "zeta_lambda" in params + assert params["zeta_omega"] == 1.0 + assert params["zeta_lambda"] == 0.5 + + def test_get_params_excludes_old_names(self): + """get_params should NOT include lambda_reg or zeta.""" + sdid = SyntheticDiD() + params = sdid.get_params() + assert "lambda_reg" not in params + assert "zeta" not in params + + def test_set_params_new_names(self): + """set_params with new names should work.""" + sdid = SyntheticDiD() + sdid.set_params(zeta_omega=2.0, zeta_lambda=0.1) + assert sdid.zeta_omega == 2.0 + assert sdid.zeta_lambda == 0.1 + + def test_set_params_deprecated_names_warn(self): + """set_params with old names should emit DeprecationWarning.""" + sdid = SyntheticDiD() + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + sdid.set_params(lambda_reg=1.0) + dep_warnings = [x for x in w if issubclass(x.category, DeprecationWarning)] + 
assert len(dep_warnings) == 1 + + def test_set_params_unknown_raises(self): + """set_params with unknown name should raise ValueError.""" + sdid = SyntheticDiD() + with pytest.raises(ValueError, match="Unknown parameter"): + sdid.set_params(nonexistent_param=1.0) + + +class TestDeprecatedParams: + """Test deprecated parameter handling in __init__.""" + + def test_lambda_reg_warns(self): + """SyntheticDiD(lambda_reg=...) emits DeprecationWarning.""" + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + sdid = SyntheticDiD(lambda_reg=0.1) + dep = [x for x in w if issubclass(x.category, DeprecationWarning)] + assert len(dep) == 1 + assert "lambda_reg" in str(dep[0].message) + + # Deprecated param is ignored — auto-computed used + assert sdid.zeta_omega is None + + def test_zeta_warns(self): + """SyntheticDiD(zeta=...) emits DeprecationWarning.""" + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + sdid = SyntheticDiD(zeta=2.0) + dep = [x for x in w if issubclass(x.category, DeprecationWarning)] + assert len(dep) == 1 + assert "zeta" in str(dep[0].message) + + assert sdid.zeta_lambda is None + + def test_both_deprecated_params(self): + """Both deprecated params at once should emit two warnings.""" + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + SyntheticDiD(lambda_reg=0.5, zeta=1.5) + dep = [x for x in w if issubclass(x.category, DeprecationWarning)] + assert len(dep) == 2 + + def test_default_variance_method_is_placebo(self): + """Default variance_method should be 'placebo' (matching R).""" + sdid = SyntheticDiD() + assert sdid.variance_method == "placebo" diff --git a/tests/test_rust_backend.py b/tests/test_rust_backend.py index 8269b5e9..6bcc2698 100644 --- a/tests/test_rust_backend.py +++ b/tests/test_rust_backend.py @@ -1667,6 +1667,484 @@ def test_trop_joint_treated_pre_nan_rust_python_parity(self): f"differ by {att_diff:.3f}, should be < 0.5" 
+@pytest.mark.skipif(not HAS_RUST_BACKEND, reason="Rust backend not available") +class TestSDIDRustBackend: + """Test suite for SDID Frank-Wolfe Rust backend functions.""" + + def test_noise_level_matches_numpy(self): + """Test Rust noise level matches NumPy implementation.""" + from diff_diff._rust_backend import compute_noise_level as rust_fn + from diff_diff.utils import _compute_noise_level_numpy as numpy_fn + + np.random.seed(42) + Y_pre = np.random.randn(10, 5) + rust_nl = rust_fn(Y_pre) + numpy_nl = numpy_fn(Y_pre) + assert abs(rust_nl - numpy_nl) < 1e-10, \ + f"Noise levels differ: rust={rust_nl}, numpy={numpy_nl}" + + def test_noise_level_single_period(self): + """Test noise level returns 0 for single pre-period.""" + from diff_diff._rust_backend import compute_noise_level as rust_fn + + Y_pre = np.random.randn(1, 5) + assert rust_fn(Y_pre) == 0.0 + + def test_sc_weight_fw_on_simplex(self): + """Test Frank-Wolfe solver produces valid simplex weights.""" + from diff_diff._rust_backend import sc_weight_fw as rust_fn + + np.random.seed(42) + Y = np.random.randn(5, 4) # 5 rows, 3 pre-periods + 1 target + weights = rust_fn(Y, 0.1, True, None, 1e-3, 100) + assert abs(weights.sum() - 1.0) < 1e-6, f"Weights should sum to 1, got {weights.sum()}" + assert np.all(weights >= -1e-6), "Weights should be non-negative" + assert weights.shape == (3,), f"Expected shape (3,), got {weights.shape}" + + def test_sc_weight_fw_matches_numpy(self): + """Test Rust Frank-Wolfe matches Python implementation.""" + from diff_diff._rust_backend import sc_weight_fw as rust_fn + from diff_diff.utils import _sc_weight_fw_numpy as numpy_fn + + np.random.seed(42) + Y = np.random.randn(8, 6) # 8 rows, 5 pre + 1 target + rust_w = rust_fn(Y, 0.5, True, None, 1e-3, 1000) + numpy_w = numpy_fn(Y, 0.5, True, None, 1e-3, 1000) + np.testing.assert_array_almost_equal( + rust_w, numpy_w, decimal=6, + err_msg="Frank-Wolfe weights should match" + ) + + def test_sc_weight_fw_with_init_weights(self): + 
"""Test Frank-Wolfe with initial weights.""" + from diff_diff._rust_backend import sc_weight_fw as rust_fn + from diff_diff.utils import _sc_weight_fw_numpy as numpy_fn + + np.random.seed(42) + Y = np.random.randn(6, 5) + init_w = np.array([0.5, 0.3, 0.15, 0.05]) + rust_w = rust_fn(Y, 0.2, True, init_w, 1e-3, 500) + numpy_w = numpy_fn(Y, 0.2, True, init_w, 1e-3, 500) + np.testing.assert_array_almost_equal( + rust_w, numpy_w, decimal=6, + err_msg="Frank-Wolfe with init weights should match" + ) + + def test_time_weights_on_simplex(self): + """Test Rust time weights are on simplex.""" + from diff_diff._rust_backend import compute_time_weights as rust_fn + + np.random.seed(42) + Y_pre = np.random.randn(8, 5) + Y_post = np.random.randn(3, 5) + weights = rust_fn(Y_pre, Y_post, 0.01, True, 1e-3, 1000) + assert abs(weights.sum() - 1.0) < 1e-6 + assert np.all(weights >= -1e-6) + assert weights.shape == (8,) + + def test_time_weights_match_numpy(self): + """Test Rust and NumPy time weights match (2-pass with sparsification).""" + from diff_diff._rust_backend import compute_time_weights as rust_fn + from diff_diff.utils import _sc_weight_fw_numpy, _sparsify + + np.random.seed(42) + Y_pre = np.random.randn(6, 4) + Y_post = np.random.randn(2, 4) + + min_decrease = 1e-3 + max_iter_pre = 100 + max_iter = 1000 + + # Rust implementation (2-pass with sparsification) + rust_w = rust_fn(Y_pre, Y_post, 0.01, True, min_decrease, + max_iter_pre, max_iter) + + # Python implementation (manual 2-pass matching Rust) + post_means = np.mean(Y_post, axis=0) + Y_time = np.column_stack([Y_pre.T, post_means]) + lam = _sc_weight_fw_numpy(Y_time, 0.01, True, None, + min_decrease, max_iter_pre) + lam = _sparsify(lam) + numpy_w = _sc_weight_fw_numpy(Y_time, 0.01, True, lam, + min_decrease, max_iter) + + np.testing.assert_array_almost_equal( + rust_w, numpy_w, decimal=6, + err_msg="Time weights should match" + ) + + def test_time_weights_single_preperiod(self): + """Test time weights with single 
pre-period returns [1.0].""" + from diff_diff._rust_backend import compute_time_weights as rust_fn + + Y_pre = np.random.randn(1, 5) + Y_post = np.random.randn(2, 5) + weights = rust_fn(Y_pre, Y_post, 0.01) + assert weights.shape == (1,) + assert abs(weights[0] - 1.0) < 1e-10 + + def test_unit_weights_on_simplex(self): + """Test Rust unit weights are on simplex.""" + from diff_diff._rust_backend import compute_sdid_unit_weights as rust_fn + + np.random.seed(42) + Y_pre = np.random.randn(8, 5) + Y_tr_mean = np.random.randn(8) + weights = rust_fn(Y_pre, Y_tr_mean, 0.5, True, 1e-3, 100, 1000) + assert abs(weights.sum() - 1.0) < 1e-6 + assert np.all(weights >= -1e-6) + assert weights.shape == (5,) + + def test_unit_weights_match_numpy(self): + """Test Rust and NumPy unit weights match.""" + from diff_diff._rust_backend import compute_sdid_unit_weights as rust_fn + from diff_diff.utils import _sc_weight_fw_numpy, _sparsify + + np.random.seed(42) + Y_pre = np.random.randn(6, 4) + Y_tr_mean = np.random.randn(6) + + # Rust implementation + rust_w = rust_fn(Y_pre, Y_tr_mean, 0.5, True, 1e-3, 100, 1000) + + # Python implementation (manual) + Y_unit = np.column_stack([Y_pre, Y_tr_mean.reshape(-1, 1)]) + omega = _sc_weight_fw_numpy(Y_unit, 0.5, True, None, 1e-3, 100) + omega = _sparsify(omega) + numpy_w = _sc_weight_fw_numpy(Y_unit, 0.5, True, omega, 1e-3, 1000) + + np.testing.assert_array_almost_equal( + rust_w, numpy_w, decimal=6, + err_msg="Unit weights should match" + ) + + def test_unit_weights_single_control(self): + """Test unit weights with single control returns [1.0].""" + from diff_diff._rust_backend import compute_sdid_unit_weights as rust_fn + + Y_pre = np.random.randn(5, 1) + Y_tr_mean = np.random.randn(5) + weights = rust_fn(Y_pre, Y_tr_mean, 0.5) + assert weights.shape == (1,) + assert abs(weights[0] - 1.0) < 1e-10 + + def test_full_sdid_rust_vs_python(self): + """Test full SDID estimation produces same results with Rust and Python.""" + import pandas as pd + 
from unittest.mock import patch + import sys + from diff_diff import SyntheticDiD + + np.random.seed(42) + n_control, n_treated, n_pre, n_post = 8, 1, 6, 2 + true_effect = 3.0 + data = [] + for i in range(n_control + n_treated): + is_treated = i >= n_control + for t in range(n_pre + n_post): + post = t >= n_pre + y = 1.0 + 0.5 * i + 0.3 * t + np.random.randn() * 0.3 + if is_treated and post: + y += true_effect + data.append({ + 'unit': i, 'time': t, 'outcome': y, + 'treated': 1 if is_treated else 0, + 'post': 1 if post else 0, + }) + df = pd.DataFrame(data) + post_periods = list(range(n_pre, n_pre + n_post)) + + # Run with Rust backend + sdid_rust = SyntheticDiD(variance_method="placebo", seed=42) + results_rust = sdid_rust.fit(df, 'outcome', 'treated', 'unit', 'time', post_periods) + + # Run with Python backend + utils_mod = sys.modules['diff_diff.utils'] + with patch.object(utils_mod, 'HAS_RUST_BACKEND', False): + sdid_py = SyntheticDiD(variance_method="placebo", seed=42) + results_py = sdid_py.fit(df.copy(), 'outcome', 'treated', 'unit', 'time', post_periods) + + # ATT should be very close + np.testing.assert_almost_equal( + results_rust.att, results_py.att, decimal=4, + err_msg="Rust and Python ATT should match" + ) + + +@pytest.mark.skipif(not HAS_RUST_BACKEND, reason="Rust backend not available") +class TestSDIDVarianceRustBackend: + """Test suite for SDID parallel variance estimation in Rust.""" + + @staticmethod + def _make_sdid_data(n_control=10, n_treated=2, n_pre=6, n_post=2, + true_effect=3.0, seed=42): + """Create well-conditioned SDID test data.""" + rng = np.random.default_rng(seed) + Y_pre_control = rng.standard_normal((n_pre, n_control)) + Y_post_control = rng.standard_normal((n_post, n_control)) + Y_pre_treated = rng.standard_normal((n_pre, n_treated)) + Y_post_treated = Y_pre_treated[:n_post, :] + true_effect + rng.standard_normal((n_post, n_treated)) * 0.3 + + Y_pre_treated_mean = np.mean(Y_pre_treated, axis=1) + Y_post_treated_mean = 
np.mean(Y_post_treated, axis=1) + + return (Y_pre_control, Y_post_control, Y_pre_treated, + Y_post_treated, Y_pre_treated_mean, Y_post_treated_mean) + + def test_placebo_se_returns_valid(self): + """Rust placebo SE produces valid float > 0.""" + from diff_diff._rust_backend import placebo_variance_sdid + + data = self._make_sdid_data() + Y_pre_c, Y_post_c, _, _, Y_pre_t_mean, Y_post_t_mean = data + + se, estimates = placebo_variance_sdid( + Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, + 2, # n_treated + 0.5, # zeta_omega + 0.01, # zeta_lambda + 1e-5, # min_decrease + True, 100, 10000, 50, 42, + ) + + assert isinstance(se, float) + assert se > 0, f"SE should be > 0, got {se}" + assert np.isfinite(se), f"SE should be finite, got {se}" + assert len(estimates) > 0, "Should have some estimates" + + def test_placebo_se_reproducible(self): + """Same seed produces same SE and estimates.""" + from diff_diff._rust_backend import placebo_variance_sdid + + data = self._make_sdid_data() + Y_pre_c, Y_post_c, _, _, Y_pre_t_mean, Y_post_t_mean = data + + args = (Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, + 2, 0.5, 0.01, 1e-5, True, 100, 10000, 30, 42) + + se1, est1 = placebo_variance_sdid(*args) + se2, est2 = placebo_variance_sdid(*args) + + assert abs(se1 - se2) < 1e-10, f"SEs should match: {se1} vs {se2}" + np.testing.assert_array_equal(est1, est2) + + def test_placebo_estimates_correct_count(self): + """All replications succeed on well-conditioned data.""" + from diff_diff._rust_backend import placebo_variance_sdid + + data = self._make_sdid_data() + Y_pre_c, Y_post_c, _, _, Y_pre_t_mean, Y_post_t_mean = data + replications = 50 + + _, estimates = placebo_variance_sdid( + Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, + 2, 0.5, 0.01, 1e-5, True, 100, 10000, replications, 42, + ) + + assert len(estimates) == replications, \ + f"Expected {replications} estimates, got {len(estimates)}" + + def test_placebo_se_statistically_matches_python(self): + """Rust and Python SEs 
are within 30% (different RNG sequences).""" + from diff_diff._rust_backend import placebo_variance_sdid + from diff_diff.utils import ( + compute_sdid_unit_weights as py_unit_weights, + compute_time_weights as py_time_weights, + compute_sdid_estimator, + ) + from diff_diff.utils import _sum_normalize + + data = self._make_sdid_data(seed=123) + Y_pre_c, Y_post_c, _, _, Y_pre_t_mean, Y_post_t_mean = data + n_treated = 2 + replications = 100 + + # Rust SE (average over multiple seeds for stability) + rust_ses = [] + for seed in [42, 43, 44]: + se_r, _ = placebo_variance_sdid( + Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, + n_treated, 0.5, 0.01, 1e-5, True, 100, 10000, replications, seed, + ) + rust_ses.append(se_r) + rust_mean_se = np.mean(rust_ses) + + # Python SE (average over multiple seeds) + python_ses = [] + for seed in [42, 43, 44]: + rng = np.random.default_rng(seed) + n_control = Y_pre_c.shape[1] + n_pseudo_control = n_control - n_treated + estimates = [] + for _ in range(replications): + perm = rng.permutation(n_control) + pc_idx = perm[:n_pseudo_control] + pt_idx = perm[n_pseudo_control:] + y_pre_pc = Y_pre_c[:, pc_idx] + y_post_pc = Y_post_c[:, pc_idx] + y_pre_pt_mean = np.mean(Y_pre_c[:, pt_idx], axis=1) + y_post_pt_mean = np.mean(Y_post_c[:, pt_idx], axis=1) + omega = py_unit_weights(y_pre_pc, y_pre_pt_mean, zeta_omega=0.5, min_decrease=1e-5) + lam = py_time_weights(y_pre_pc, y_post_pc, zeta_lambda=0.01, min_decrease=1e-5) + tau = compute_sdid_estimator(y_pre_pc, y_post_pc, y_pre_pt_mean, y_post_pt_mean, omega, lam) + estimates.append(tau) + n = len(estimates) + py_se = np.sqrt((n - 1) / n) * np.std(estimates, ddof=1) + python_ses.append(py_se) + python_mean_se = np.mean(python_ses) + + # SEs should be in the same ballpark (within 30%) + ratio = rust_mean_se / python_mean_se if python_mean_se > 0 else float('inf') + assert 0.7 < ratio < 1.3, \ + f"SE ratio {ratio:.2f} out of range: Rust={rust_mean_se:.4f}, Python={python_mean_se:.4f}" + + def 
test_placebo_insufficient_controls(self): + """Returns (0.0, []) when n_control <= n_treated.""" + from diff_diff._rust_backend import placebo_variance_sdid + + Y_pre_c = np.random.randn(5, 2) + Y_post_c = np.random.randn(2, 2) + Y_pre_t_mean = np.random.randn(5) + Y_post_t_mean = np.random.randn(2) + + se, estimates = placebo_variance_sdid( + Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, + 3, # n_treated > n_control=2 + 0.5, 0.01, 1e-5, True, 100, 10000, 50, 42, + ) + + assert se == 0.0 + assert len(estimates) == 0 + + def test_bootstrap_se_returns_valid(self): + """Rust bootstrap SE produces valid float > 0.""" + from diff_diff._rust_backend import bootstrap_variance_sdid + + data = self._make_sdid_data() + Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, _, _ = data + + # Need unit/time weights + omega = np.ones(Y_pre_c.shape[1]) / Y_pre_c.shape[1] + lam = np.ones(Y_pre_c.shape[0]) / Y_pre_c.shape[0] + + se, estimates, n_failed = bootstrap_variance_sdid( + Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, + omega, lam, 50, 42, + ) + + assert isinstance(se, float) + assert se > 0, f"SE should be > 0, got {se}" + assert np.isfinite(se) + assert len(estimates) > 0 + + def test_bootstrap_se_reproducible(self): + """Same seed produces same SE.""" + from diff_diff._rust_backend import bootstrap_variance_sdid + + data = self._make_sdid_data() + Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, _, _ = data + omega = np.ones(Y_pre_c.shape[1]) / Y_pre_c.shape[1] + lam = np.ones(Y_pre_c.shape[0]) / Y_pre_c.shape[0] + + args = (Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, omega, lam, 30, 42) + + se1, est1, _ = bootstrap_variance_sdid(*args) + se2, est2, _ = bootstrap_variance_sdid(*args) + + assert abs(se1 - se2) < 1e-10 + np.testing.assert_array_equal(est1, est2) + + def test_bootstrap_se_statistically_matches_python(self): + """Rust and Python bootstrap SEs are within a factor of 2.""" + from diff_diff._rust_backend import bootstrap_variance_sdid + from diff_diff.utils import compute_sdid_estimator, _sum_normalize + + 
data = self._make_sdid_data(seed=99) + Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, _, _ = data + n_control = Y_pre_c.shape[1] + n_treated = Y_pre_t.shape[1] + n_total = n_control + n_treated + n_pre = Y_pre_c.shape[0] + n_bootstrap = 200 + + omega = np.ones(n_control) / n_control + lam = np.ones(n_pre) / n_pre + + # Rust SE + se_rust, _, _ = bootstrap_variance_sdid( + Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, + omega, lam, n_bootstrap, 42, + ) + + # Python SE + Y_full = np.block([ + [Y_pre_c, Y_pre_t], + [Y_post_c, Y_post_t] + ]) + rng = np.random.default_rng(42) + py_estimates = [] + for _ in range(n_bootstrap): + boot_idx = rng.choice(n_total, size=n_total, replace=True) + boot_is_control = boot_idx < n_control + if not np.any(boot_is_control) or np.all(boot_is_control): + continue + boot_omega = _sum_normalize(omega[boot_idx[boot_is_control]]) + Y_boot = Y_full[:, boot_idx] + Y_boot_pre_t_mean = np.mean(Y_boot[:n_pre, ~boot_is_control], axis=1) + Y_boot_post_t_mean = np.mean(Y_boot[n_pre:, ~boot_is_control], axis=1) + tau = compute_sdid_estimator( + Y_boot[:n_pre, boot_is_control], + Y_boot[n_pre:, boot_is_control], + Y_boot_pre_t_mean, Y_boot_post_t_mean, + boot_omega, lam, + ) + py_estimates.append(tau) + se_python = float(np.std(py_estimates, ddof=1)) + + ratio = se_rust / se_python if se_python > 0 else float('inf') + assert 0.5 < ratio < 2.0, \ + f"Bootstrap SE ratio {ratio:.2f}: Rust={se_rust:.4f}, Python={se_python:.4f}" + + def test_full_sdid_fit_uses_rust_variance(self): + """SyntheticDiD.fit() uses Rust variance when available and produces valid results.""" + import pandas as pd + from diff_diff import SyntheticDiD + + np.random.seed(42) + n_control, n_treated, n_pre, n_post = 8, 2, 6, 2 + true_effect = 3.0 + data = [] + for i in range(n_control + n_treated): + is_treated = i >= n_control + for t in range(n_pre + n_post): + post = t >= n_pre + y = 1.0 + 0.5 * i + 0.3 * t + np.random.randn() * 0.3 + if is_treated and post: + y += true_effect + data.append({ + 
'unit': i, 'time': t, 'outcome': y, + 'treated': 1 if is_treated else 0, + }) + df = pd.DataFrame(data) + post_periods = list(range(n_pre, n_pre + n_post)) + + # Fit with placebo variance (uses Rust) + sdid = SyntheticDiD(variance_method="placebo", n_bootstrap=50, seed=42) + results = sdid.fit(df, 'outcome', 'treated', 'unit', 'time', post_periods) + + assert np.isfinite(results.att), f"ATT should be finite: {results.att}" + assert np.isfinite(results.se), f"SE should be finite: {results.se}" + assert results.se > 0, f"SE should be > 0: {results.se}" + + # Fit with bootstrap variance (uses Rust) + sdid_boot = SyntheticDiD(variance_method="bootstrap", n_bootstrap=50, seed=42) + results_boot = sdid_boot.fit(df, 'outcome', 'treated', 'unit', 'time', post_periods) + + assert np.isfinite(results_boot.att), f"Bootstrap ATT should be finite: {results_boot.att}" + assert np.isfinite(results_boot.se), f"Bootstrap SE should be finite: {results_boot.se}" + assert results_boot.se > 0, f"Bootstrap SE should be > 0: {results_boot.se}" + + class TestFallbackWhenNoRust: """Test that pure Python fallback works when Rust is unavailable.""" diff --git a/tests/test_utils.py b/tests/test_utils.py index f063050e..4084ae3b 100644 --- a/tests/test_utils.py +++ b/tests/test_utils.py @@ -969,7 +969,7 @@ def test_returns_correct_number_of_effects(self, sdid_panel_data): # Compute weights unit_weights = compute_synthetic_weights(Y_pre_control, Y_pre_treated) - time_weights = compute_time_weights(Y_pre_control, Y_pre_treated) + time_weights = compute_time_weights(Y_pre_control, Y_post_control, zeta_lambda=1e-6) control_units = list(control_pivot.columns) @@ -1001,7 +1001,7 @@ def test_placebo_effects_distribution(self, sdid_panel_data): Y_pre_treated = treated_mean.loc[pre_periods].values unit_weights = compute_synthetic_weights(Y_pre_control, Y_pre_treated) - time_weights = compute_time_weights(Y_pre_control, Y_pre_treated) + time_weights = compute_time_weights(Y_pre_control, Y_post_control, 
zeta_lambda=1e-6) control_units = list(control_pivot.columns) @@ -1033,7 +1033,7 @@ def test_n_placebo_limits_output(self, sdid_panel_data): Y_pre_treated = treated_mean.loc[pre_periods].values unit_weights = compute_synthetic_weights(Y_pre_control, Y_pre_treated) - time_weights = compute_time_weights(Y_pre_control, Y_pre_treated) + time_weights = compute_time_weights(Y_pre_control, Y_post_control, zeta_lambda=1e-6) control_units = list(control_pivot.columns) @@ -1111,42 +1111,52 @@ def test_min_weight_threshold(self): class TestComputeTimeWeightsEdgeCases: - """Edge case tests for compute_time_weights.""" + """Edge case tests for compute_time_weights (new Frank-Wolfe signature).""" def test_single_period(self): """Test with single pre-treatment period.""" - Y_control = np.array([[1.0, 2.0, 3.0]]) - Y_treated = np.array([2.0]) + Y_pre_control = np.array([[1.0, 2.0, 3.0]]) + Y_post_control = np.array([[4.0, 5.0, 6.0]]) - weights = compute_time_weights(Y_control, Y_treated) + weights = compute_time_weights(Y_pre_control, Y_post_control, zeta_lambda=0.01) assert len(weights) == 1 assert abs(weights[0] - 1.0) < 1e-6 def test_zeta_regularization_effect(self): - """Test that zeta affects weight uniformity.""" + """Test that zeta_lambda affects weight uniformity.""" np.random.seed(42) - Y_control = np.random.randn(10, 5) - Y_treated = np.random.randn(10) + Y_pre = np.random.randn(10, 5) + Y_post = np.random.randn(3, 5) - weights_low_zeta = compute_time_weights(Y_control, Y_treated, zeta=0.1) - weights_high_zeta = compute_time_weights(Y_control, Y_treated, zeta=10.0) + weights_low = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.001) + weights_high = compute_time_weights(Y_pre, Y_post, zeta_lambda=100.0) - # High zeta should give more uniform weights - var_low = np.var(weights_low_zeta) - var_high = np.var(weights_high_zeta) + # High regularization should give more uniform weights + var_low = np.var(weights_low) + var_high = np.var(weights_high) assert var_high <= 
var_low + 0.01 - def test_weights_all_positive(self): - """Test that time weights are all positive.""" + def test_weights_nonnegative(self): + """Test that time weights are non-negative (simplex constraint).""" np.random.seed(42) - Y_control = np.random.randn(10, 5) - Y_treated = np.random.randn(10) + Y_pre = np.random.randn(10, 5) + Y_post = np.random.randn(3, 5) + + weights = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.01) + + assert np.all(weights >= -1e-10) + + def test_weights_sum_to_one(self): + """Test that time weights sum to 1.""" + np.random.seed(42) + Y_pre = np.random.randn(10, 5) + Y_post = np.random.randn(3, 5) - weights = compute_time_weights(Y_control, Y_treated) + weights = compute_time_weights(Y_pre, Y_post, zeta_lambda=0.01) - assert np.all(weights > 0) + assert abs(np.sum(weights) - 1.0) < 1e-6 # ============================================================================= From 7158bf0f39f2671d32a62e5e8f6be9a2157062ec Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 16:16:30 -0500 Subject: [PATCH 2/9] Fix CI doctest failure, noise_level NaN bug, and address PR review feedback MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Wrap Unicode formula in Rust doc comment in ```text fence (fixes doctest CI) - Guard noise_level for single first-diff element (size<=1 → 0.0, not NaN) - Remove **kwargs from SyntheticDiD.__init__ (reject unknown params) - Update Registry: placebo re-estimates weights (not fixed), convergence=1e-5 - Add tests: noise_level edge cases, placebo re-estimation pin, kwargs rejection Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 1 - diff_diff/utils.py | 2 +- docs/methodology/REGISTRY.md | 14 ++-- rust/src/sdid_variance.rs | 6 +- tests/test_estimators.py | 5 ++ tests/test_methodology_sdid.py | 127 +++++++++++++++++++++++++++++++++ 6 files changed, 145 insertions(+), 10 deletions(-) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py 
index f77d4ca4..5a790dae 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -140,7 +140,6 @@ def __init__( # Deprecated — accepted for backward compat, ignored with warning lambda_reg: Optional[float] = None, zeta: Optional[float] = None, - **kwargs, ): if lambda_reg is not None: warnings.warn( diff --git a/diff_diff/utils.py b/diff_diff/utils.py index 71f9d80f..0507e4ca 100644 --- a/diff_diff/utils.py +++ b/diff_diff/utils.py @@ -1196,7 +1196,7 @@ def _compute_noise_level_numpy(Y_pre_control: np.ndarray) -> float: # R: apply(Y[1:N0, 1:T0], 1, diff) computes diff per row (unit). # Our matrix is (T, N) so diff along axis=0 gives (T-1, N). first_diffs = np.diff(Y_pre_control, axis=0) # (T_pre-1, N_co) - if first_diffs.size == 0: + if first_diffs.size <= 1: return 0.0 return float(np.std(first_diffs, ddof=1)) diff --git a/docs/methodology/REGISTRY.md b/docs/methodology/REGISTRY.md index b15ebef8..6bf04b02 100644 --- a/docs/methodology/REGISTRY.md +++ b/docs/methodology/REGISTRY.md @@ -622,19 +622,20 @@ step = clip(step, 0, 1) x_new = x + step × d_x ``` -Convergence criterion: stop when objective decrease < min_decrease² (default min_decrease=1e-3). +Convergence criterion: stop when objective decrease < min_decrease² (default min_decrease = 1e-5 × noise_level, max_iter = 10000, max_iter_pre_sparsify = 100). *Standard errors:* - Default: Placebo variance estimator (Algorithm 4 in paper) 1. Randomly permute control unit indices 2. Split into pseudo-controls (first N_co - N_tr) and pseudo-treated (last N_tr) - 3. Renormalize original unit weights for pseudo-controls: `ω_pseudo = _sum_normalize(ω[pseudo_control_idx])` - 4. Compute SDID estimate with renormalized weights and **fixed** time weights (no re-estimation) - 5. Repeat `replications` times (default 200) - 6. `SE = sqrt((r-1)/r) × sd(placebo_estimates)` where r = number of successful replications + 3. Re-estimate unit weights (Frank-Wolfe) on pseudo-control/pseudo-treated data + 4. 
Re-estimate time weights (Frank-Wolfe) on pseudo-control data + 5. Compute SDID estimate with re-estimated weights + 6. Repeat `replications` times (default 200) + 7. `SE = sqrt((r-1)/r) × sd(placebo_estimates)` where r = number of successful replications - This matches R's `synthdid::vcov(method="placebo")`. + This matches R's `synthdid::vcov(method="placebo")` which passes `update.omega=TRUE, update.lambda=TRUE` via `opts`. - Alternative: Bootstrap at unit level (matching R's `synthdid::vcov(method="bootstrap")`) 1. Resample ALL units (control + treated) with replacement @@ -670,6 +671,7 @@ Convergence criterion: stop when objective decrease < min_decrease² (default mi - [x] Auto-regularization: noise_level = sd(first_diffs), zeta_omega = (N1*T1)^0.25 * noise_level, zeta_lambda = 1e-6 * noise_level - [x] Sparsification: v[v <= max(v)/4] = 0; v = v/sum(v) - [x] Placebo SE formula: sqrt((r-1)/r) * sd(placebo_estimates) +- [x] Placebo SE: re-estimates omega and lambda per replication (matching R's update.omega=TRUE, update.lambda=TRUE) - [x] Bootstrap: fixed weights (original lambda unchanged, omega renormalized for resampled controls) - [x] Returns both unit and time weights for interpretation - [x] Column centering (intercept=True) in Frank-Wolfe optimization diff --git a/rust/src/sdid_variance.rs b/rust/src/sdid_variance.rs index c08bdd7a..cae15cf4 100644 --- a/rust/src/sdid_variance.rs +++ b/rust/src/sdid_variance.rs @@ -63,8 +63,10 @@ fn column_means(matrix: &Array2, col_indices: &[usize]) -> Array1 { /// /// Matches `compute_sdid_estimator` in Python's `utils.py:1587-1604`: /// -/// τ̂ = (Ȳ_treated,post - Σ_t λ_t * Y_treated,t) -/// - Σ_j ω_j * (Ȳ_j,post - Σ_t λ_t * Y_j,t) +/// ```text +/// τ̂ = (Ȳ_treated,post - Σ_t λ_t * Y_treated,t) +/// - Σ_j ω_j * (Ȳ_j,post - Σ_t λ_t * Y_j,t) +/// ``` fn sdid_estimator_internal( y_pre_control: &Array2, y_post_control: &Array2, diff --git a/tests/test_estimators.py b/tests/test_estimators.py index ab394a2b..6bcc9f89 100644 
--- a/tests/test_estimators.py +++ b/tests/test_estimators.py @@ -3071,6 +3071,11 @@ def test_more_pre_periods_than_control_units(self, ci_params): assert np.isfinite(results.att) assert results.se > 0 + def test_unknown_kwargs_rejected(self): + """Unknown kwargs raise TypeError instead of being silently swallowed.""" + with pytest.raises(TypeError): + SyntheticDiD(bogus_param=True) + class TestSyntheticWeightsUtils: """Tests for synthetic weight utility functions.""" diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py index 812392c5..41c76d58 100644 --- a/tests/test_methodology_sdid.py +++ b/tests/test_methodology_sdid.py @@ -14,6 +14,7 @@ from diff_diff.synthetic_did import SyntheticDiD from diff_diff.utils import ( _compute_noise_level, + _compute_noise_level_numpy, _compute_regularization, _fw_step, _sc_weight_fw, @@ -603,3 +604,129 @@ def test_default_variance_method_is_placebo(self): """Default variance_method should be 'placebo' (matching R).""" sdid = SyntheticDiD() assert sdid.variance_method == "placebo" + + +class TestNoiseLevelEdgeCases: + """Edge case tests for _compute_noise_level_numpy.""" + + def test_noise_level_single_control_two_periods(self): + """noise_level returns 0.0 (not NaN) for 1 control, 2 pre-periods. + + With shape (2, 1), first_diffs has size=1, and np.std([x], ddof=1) + would divide by zero → NaN. Guard ensures 0.0 is returned instead, + matching the Rust backend behavior. 
+ """ + Y = np.array([[1.0], [2.0]]) # (2, 1) + result = _compute_noise_level_numpy(Y) + assert result == 0.0 + assert not np.isnan(result) + + def test_noise_level_single_element_returns_zero(self): + """noise_level returns 0.0 when first_diffs has exactly 1 element.""" + # (2, 1) → diff → (1, 1) → size=1 → return 0.0 + Y = np.array([[5.0], [10.0]]) + result = _compute_noise_level_numpy(Y) + assert result == 0.0 + + def test_noise_level_empty_returns_zero(self): + """noise_level returns 0.0 for single time period (no diffs possible).""" + Y = np.array([[1.0, 2.0, 3.0]]) # (1, 3) + result = _compute_noise_level_numpy(Y) + assert result == 0.0 + + +class TestPlaceboReestimation: + """Tests verifying placebo variance re-estimates weights (not fixed).""" + + def test_placebo_reestimates_weights_not_fixed(self): + """Placebo variance re-estimates omega/lambda per replication (matching R). + + Verifies the methodology choice: R's vcov(method='placebo') passes + update.omega=TRUE, update.lambda=TRUE, so weights are re-estimated + via Frank-Wolfe on each permutation — NOT renormalized from originals. + + We verify this by comparing the actual placebo SE against a manual + fixed-weight computation; if they differ, re-estimation is happening. + """ + # Need enough controls for placebo to work (n_control > n_treated) + # and enough variation for weights to differ between re-estimation + # and renormalization. + df = _make_panel(n_control=15, n_treated=2, n_pre=6, n_post=3, + att=5.0, seed=123) + post_periods = list(range(6, 9)) + + # Fit SDID to get original weights and matrices + sdid = SyntheticDiD(variance_method="placebo", n_bootstrap=50, seed=42) + results = sdid.fit( + df, + outcome="outcome", + treatment="treated", + unit="unit", + time="period", + post_periods=post_periods, + ) + actual_se = results.se + + # Now compute a "fixed weight" placebo manually: + # permute controls, renormalize original omega (no Frank-Wolfe), + # keep original lambda unchanged. 
+ rng = np.random.default_rng(42) + + # Build the outcome matrix (T, N) as the estimator does + pivot = df.pivot(index="period", columns="unit", values="outcome") + control_units = sorted(results.unit_weights.keys()) + treated_mask = df.groupby("unit")["treated"].max().values.astype(bool) + control_idx = np.where(~treated_mask)[0] + treated_idx = np.where(treated_mask)[0] + Y = pivot.values # (T, N) + pre_periods_arr = np.array(post_periods) + pre_mask = ~np.isin(pivot.index.values, pre_periods_arr) + + Y_pre_control = Y[np.ix_(pre_mask, control_idx)] + Y_post_control = Y[np.ix_(~pre_mask, control_idx)] + + # Extract numpy arrays from result dicts (ordered by control unit) + unit_weights_arr = np.array([results.unit_weights[u] for u in control_units]) + time_weights_arr = np.array([results.time_weights[t] + for t in sorted(results.time_weights.keys())]) + + n_control = len(control_idx) + n_treated_count = len(treated_idx) + n_pseudo_control = n_control - n_treated_count + + fixed_estimates = [] + for _ in range(50): + perm = rng.permutation(n_control) + pc_idx = perm[:n_pseudo_control] + pt_idx = perm[n_pseudo_control:] + + # Fixed weights: renormalize original omega for pseudo-controls + fixed_omega = _sum_normalize(unit_weights_arr[pc_idx]) + fixed_lambda = time_weights_arr # unchanged + + Y_pre_pc = Y_pre_control[:, pc_idx] + Y_post_pc = Y_post_control[:, pc_idx] + Y_pre_pt_mean = np.mean(Y_pre_control[:, pt_idx], axis=1) + Y_post_pt_mean = np.mean(Y_post_control[:, pt_idx], axis=1) + + try: + tau = compute_sdid_estimator( + Y_pre_pc, Y_post_pc, + Y_pre_pt_mean, Y_post_pt_mean, + fixed_omega, fixed_lambda, + ) + fixed_estimates.append(tau) + except (ValueError, np.linalg.LinAlgError): + continue + + if len(fixed_estimates) >= 2: + n_s = len(fixed_estimates) + fixed_se = (np.sqrt((n_s - 1) / n_s) + * np.std(fixed_estimates, ddof=1)) + # The two SEs should differ because re-estimation produces + # different weights than renormalization + assert actual_se != 
pytest.approx(fixed_se, rel=0.01), ( + f"Placebo SE ({actual_se:.6f}) matches fixed-weight SE " + f"({fixed_se:.6f}), suggesting weights are NOT being " + f"re-estimated as R's synthdid does." + ) From c62d3bcc6b78aae0a7bbc4976745fa162a1a6a4a Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 18:18:12 -0500 Subject: [PATCH 3/9] Add input validation, pre-fit warning, and docs fixes from AI review round 2 MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Address 5 issues from PR #145 AI review: - P0: Validate treatment is constant within unit (reject staggered designs) - P1: Enforce balanced panel (all units must have all periods) - P1: Warn when pre-treatment fit RMSE exceeds treated outcome SD - P1: Fix Registry FW iteration count (1000 → 10000, matching R/code) - P2: Fix misleading placebo docstring (weights use fresh start, not warm start) Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 51 ++++++++++- docs/methodology/REGISTRY.md | 7 +- tests/test_methodology_sdid.py | 163 +++++++++++++++++++++++++++++++++ 3 files changed, 218 insertions(+), 3 deletions(-) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index 5a790dae..31104f2e 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -267,6 +267,24 @@ def fit( # type: ignore[override] # Identify treated and control units # Treatment indicator should be constant within unit unit_treatment = data.groupby(unit)[treatment].first() + + # Validate treatment is constant within unit (SDID requires block treatment) + treatment_nunique = data.groupby(unit)[treatment].nunique() + varying_units = treatment_nunique[treatment_nunique > 1] + if len(varying_units) > 0: + example_unit = varying_units.index[0] + example_vals = sorted( + data.loc[data[unit] == example_unit, treatment].unique() + ) + raise ValueError( + f"Treatment indicator varies within {len(varying_units)} unit(s) " + f"(e.g., unit '{example_unit}' has 
values {example_vals}). " + f"SyntheticDiD requires 'block' treatment where treatment is " + f"constant within each unit across all time periods. " + f"For staggered adoption designs, use CallawaySantAnna or " + f"ImputationDiD instead." + ) + treated_units = unit_treatment[unit_treatment == 1].index.tolist() control_units = unit_treatment[unit_treatment == 0].index.tolist() @@ -275,6 +293,21 @@ def fit( # type: ignore[override] if len(control_units) == 0: raise ValueError("No control units found") + # Validate balanced panel (SDID requires all units observed in all periods) + periods_per_unit = data.groupby(unit)[time].nunique() + expected_n_periods = len(all_periods) + unbalanced_units = periods_per_unit[periods_per_unit != expected_n_periods] + if len(unbalanced_units) > 0: + example_unit = unbalanced_units.index[0] + actual_count = unbalanced_units.iloc[0] + raise ValueError( + f"Panel is not balanced: {len(unbalanced_units)} unit(s) do not " + f"have observations in all {expected_n_periods} periods " + f"(e.g., unit '{example_unit}' has {actual_count} periods). " + f"SyntheticDiD requires a balanced panel. Use " + f"diff_diff.prep.balance_panel() to balance the panel first." + ) + # Residualize covariates if provided working_data = data.copy() if covariates: @@ -338,6 +371,22 @@ def fit( # type: ignore[override] synthetic_pre = Y_pre_control @ unit_weights pre_fit_rmse = np.sqrt(np.mean((Y_pre_treated_mean - synthetic_pre) ** 2)) + # Warn if pre-treatment fit is poor (Registry requirement). + # Threshold: 1× SD of treated pre-treatment outcomes — a natural baseline + # since RMSE exceeding natural variation indicates the synthetic control + # fails to reproduce the treated series' level or trend. 
+ pre_treatment_sd = np.std(Y_pre_treated_mean, ddof=1) if len(Y_pre_treated_mean) > 1 else 0.0 + if pre_treatment_sd > 0 and pre_fit_rmse > pre_treatment_sd: + warnings.warn( + f"Pre-treatment fit is poor: RMSE ({pre_fit_rmse:.4f}) exceeds " + f"the standard deviation of treated pre-treatment outcomes " + f"({pre_treatment_sd:.4f}). The synthetic control may not " + f"adequately reproduce treated unit trends. Consider adding " + f"more control units or adjusting regularization.", + UserWarning, + stacklevel=2, + ) + # Compute standard errors based on variance_method if self.variance_method == "bootstrap": se, bootstrap_estimates = self._bootstrap_se( @@ -814,7 +863,7 @@ def _placebo_variance_se( # Re-estimate weights on permuted data (matching R's behavior) # R passes update.omega=TRUE, update.lambda=TRUE via opts, - # using original weights as starting points for FW optimization. + # re-estimating weights from uniform initialization (fresh start). # Unit weights: re-estimate on pseudo-control/pseudo-treated data pseudo_omega = compute_sdid_unit_weights( Y_pre_pseudo_control, diff --git a/docs/methodology/REGISTRY.md b/docs/methodology/REGISTRY.md index 6bf04b02..ed022881 100644 --- a/docs/methodology/REGISTRY.md +++ b/docs/methodology/REGISTRY.md @@ -587,7 +587,7 @@ where A = Y_unit[:, :N_co], b = Y_unit[:, N_co], and centering is column-wise (i **Two-pass sparsification procedure** (matches R's `synthdid::sc.weight.fw` + `sparsify_function`): 1. First pass: Run Frank-Wolfe for 100 iterations (max_iter_pre_sparsify) from uniform initialization 2. Sparsify: `v[v <= max(v)/4] = 0; v = v / sum(v)` (zero out small weights, renormalize) -3. Second pass: Run Frank-Wolfe for 1000 iterations (max_iter) starting from sparsified weights +3. Second pass: Run Frank-Wolfe for 10000 iterations (max_iter) starting from sparsified weights The sparsification step concentrates weights on the most important control units, improving interpretability and stability. 
@@ -659,13 +659,16 @@ Convergence criterion: stop when objective decrease < min_decrease² (default mi - **Noise level with < 2 pre-periods**: Returns 0.0, which makes both zeta_omega and zeta_lambda equal to 0.0 (no regularization). - **NaN inference for undefined statistics**: t_stat uses NaN when SE is zero or non-finite; p_value and CI also NaN. Matches CallawaySantAnna NaN convention. - **Placebo p-value floor**: `p_value = max(empirical_p, 1/(n_replications + 1))` to avoid reporting exactly zero. +- **Varying treatment within unit**: Raises `ValueError`. SDID requires block treatment (constant within each unit). Suggests CallawaySantAnna or ImputationDiD for staggered adoption. +- **Unbalanced panel**: Raises `ValueError`. SDID requires all units observed in all periods. Suggests `balance_panel()`. +- **Poor pre-treatment fit**: Warns (`UserWarning`) when `pre_fit_rmse > std(treated_pre_outcomes, ddof=1)`. Diagnostic only; estimation proceeds. **Reference implementation(s):** - R: `synthdid::synthdid_estimate()` (Arkhangelsky et al.'s official package) - Key R functions matched: `sc.weight.fw()` (Frank-Wolfe), `sparsify_function` (sparsification), `vcov.synthdid_estimate()` (variance) **Requirements checklist:** -- [x] Unit weights: Frank-Wolfe on collapsed form (T_pre, N_co+1), two-pass sparsification (100 iters -> sparsify -> 1000 iters) +- [x] Unit weights: Frank-Wolfe on collapsed form (T_pre, N_co+1), two-pass sparsification (100 iters -> sparsify -> 10000 iters) - [x] Time weights: Frank-Wolfe on collapsed form (N_co, T_pre+1), last column = per-control post mean - [x] Unit and time weights: sum to 1, non-negative (simplex constraint) - [x] Auto-regularization: noise_level = sd(first_diffs), zeta_omega = (N1*T1)^0.25 * noise_level, zeta_lambda = 1e-6 * noise_level diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py index 41c76d58..75668f37 100644 --- a/tests/test_methodology_sdid.py +++ b/tests/test_methodology_sdid.py @@ -11,6 
+11,8 @@ import numpy as np import pytest +import pandas as pd + from diff_diff.synthetic_did import SyntheticDiD from diff_diff.utils import ( _compute_noise_level, @@ -730,3 +732,164 @@ def test_placebo_reestimates_weights_not_fixed(self): f"({fixed_se:.6f}), suggesting weights are NOT being " f"re-estimated as R's synthdid does." ) + + +# ============================================================================= +# Treatment Validation +# ============================================================================= + + +class TestTreatmentValidation: + """Test that SDID rejects time-varying treatment (staggered designs).""" + + def test_varying_treatment_within_unit_raises(self): + """Unit whose treatment switches over time should raise ValueError.""" + np.random.seed(42) + data = pd.DataFrame({ + "unit": [1, 1, 1, 1, 2, 2, 2, 2, 3, 3, 3, 3], + "time": [1, 2, 3, 4, 1, 2, 3, 4, 1, 2, 3, 4], + "outcome": np.random.randn(12), + # Unit 1: treatment turns on at time 3 (staggered) + "treated": [0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0], + }) + sdid = SyntheticDiD() + with pytest.raises(ValueError, match="Treatment indicator varies within"): + sdid.fit( + data, outcome="outcome", treatment="treated", + unit="unit", time="time", post_periods=[3, 4], + ) + + def test_constant_treatment_passes(self): + """Normal block-treatment data should pass validation.""" + np.random.seed(42) + n_units, n_periods = 10, 8 + rows = [] + for u in range(n_units): + is_treated = 1 if u < 3 else 0 + for t in range(n_periods): + rows.append({ + "unit": u, "time": t, + "outcome": np.random.randn() + (2.0 if is_treated and t >= 5 else 0), + "treated": is_treated, + }) + data = pd.DataFrame(rows) + sdid = SyntheticDiD() + result = sdid.fit( + data, outcome="outcome", treatment="treated", + unit="unit", time="time", post_periods=[5, 6, 7], + ) + assert result is not None + + +# ============================================================================= +# Balanced Panel Validation +# 
============================================================================= + + +class TestBalancedPanelValidation: + """Test that SDID rejects unbalanced panels.""" + + def test_unbalanced_panel_raises(self): + """Unit missing a period should raise ValueError.""" + np.random.seed(42) + rows = [] + for u in range(6): + is_treated = 1 if u < 2 else 0 + for t in range(5): + rows.append({ + "unit": u, "time": t, + "outcome": np.random.randn(), + "treated": is_treated, + }) + data = pd.DataFrame(rows) + # Drop one observation to make panel unbalanced + data = data[~((data["unit"] == 3) & (data["time"] == 2))].reset_index(drop=True) + + sdid = SyntheticDiD() + with pytest.raises(ValueError, match="Panel is not balanced"): + sdid.fit( + data, outcome="outcome", treatment="treated", + unit="unit", time="time", post_periods=[3, 4], + ) + + def test_balanced_panel_passes(self): + """Fully balanced panel should pass validation.""" + np.random.seed(42) + rows = [] + for u in range(8): + is_treated = 1 if u < 2 else 0 + for t in range(6): + rows.append({ + "unit": u, "time": t, + "outcome": np.random.randn() + (1.5 if is_treated and t >= 4 else 0), + "treated": is_treated, + }) + data = pd.DataFrame(rows) + sdid = SyntheticDiD() + result = sdid.fit( + data, outcome="outcome", treatment="treated", + unit="unit", time="time", post_periods=[4, 5], + ) + assert result is not None + + +# ============================================================================= +# Pre-treatment Fit Warning +# ============================================================================= + + +class TestPreTreatmentFitWarning: + """Test that poor pre-treatment fit emits a warning.""" + + def test_poor_fit_emits_warning(self): + """Treated units at very different level from controls should warn.""" + np.random.seed(42) + rows = [] + for u in range(10): + is_treated = 1 if u < 2 else 0 + # Large level difference: treated ~100, control ~10 + level = 100.0 if is_treated else 10.0 + for t in range(8): 
+ rows.append({ + "unit": u, "time": t, + "outcome": level + np.random.randn() * 0.5, + "treated": is_treated, + }) + data = pd.DataFrame(rows) + sdid = SyntheticDiD() + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + sdid.fit( + data, outcome="outcome", treatment="treated", + unit="unit", time="time", post_periods=[6, 7], + ) + fit_warnings = [x for x in w if "Pre-treatment fit is poor" in str(x.message)] + assert len(fit_warnings) >= 1, ( + "Expected warning about poor pre-treatment fit but none was raised" + ) + + def test_good_fit_no_warning(self): + """Parallel trends data with similar levels should not warn.""" + np.random.seed(42) + rows = [] + for u in range(10): + is_treated = 1 if u < 3 else 0 + for t in range(8): + # Same level, parallel trends, treatment effect only in post + rows.append({ + "unit": u, "time": t, + "outcome": t + np.random.randn() * 0.3 + (2.0 if is_treated and t >= 5 else 0), + "treated": is_treated, + }) + data = pd.DataFrame(rows) + sdid = SyntheticDiD() + with warnings.catch_warnings(record=True) as w: + warnings.simplefilter("always") + sdid.fit( + data, outcome="outcome", treatment="treated", + unit="unit", time="time", post_periods=[5, 6, 7], + ) + fit_warnings = [x for x in w if "Pre-treatment fit is poor" in str(x.message)] + assert len(fit_warnings) == 0, ( + f"Unexpected pre-treatment fit warning: {fit_warnings[0].message}" + ) From ced46f265aaada378e8b925f61a6648399d1cfea Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 18:37:05 -0500 Subject: [PATCH 4/9] Document min_decrease floor for zero noise and guard empty Y_post_control MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Address AI review round 3: (1) Document the 1e-5 min_decrease floor when noise_level == 0 as an intentional deviation from R in REGISTRY.md and inline comment — enables early stopping with equivalent results. 
(2) Add ValueError guard in compute_time_weights for empty Y_post_control before both Python and Rust dispatch paths. Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 5 ++++- diff_diff/utils.py | 6 ++++++ docs/methodology/REGISTRY.md | 2 +- tests/test_methodology_sdid.py | 34 ++++++++++++++++++++++++++++++++++ 4 files changed, 45 insertions(+), 2 deletions(-) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index 31104f2e..02a8db16 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -334,7 +334,10 @@ def fit( # type: ignore[override] from diff_diff.utils import _compute_noise_level noise_level = _compute_noise_level(Y_pre_control) - # Data-dependent convergence threshold (matches R's 1e-5 * noise.level) + # Data-dependent convergence threshold (matches R's 1e-5 * noise.level). + # Floor of 1e-5 when noise_level == 0: R would use 0.0, causing FW to + # run all max_iter iterations. The result is equivalent (zero-noise + # data has no variation to optimize), but the floor enables early stop. min_decrease = 1e-5 * noise_level if noise_level > 0 else 1e-5 # Compute unit weights (Frank-Wolfe with sparsification) diff --git a/diff_diff/utils.py b/diff_diff/utils.py index 0507e4ca..874facb6 100644 --- a/diff_diff/utils.py +++ b/diff_diff/utils.py @@ -1420,6 +1420,12 @@ def compute_time_weights( np.ndarray Time weights of shape (n_pre,) on the simplex. """ + if Y_post_control.shape[0] == 0: + raise ValueError( + "Y_post_control has no rows. At least one post-treatment period " + "is required for time weight computation." 
+ ) + if HAS_RUST_BACKEND: return np.asarray(_rust_compute_time_weights( np.ascontiguousarray(Y_pre_control, dtype=np.float64), diff --git a/docs/methodology/REGISTRY.md b/docs/methodology/REGISTRY.md index ed022881..378c25d0 100644 --- a/docs/methodology/REGISTRY.md +++ b/docs/methodology/REGISTRY.md @@ -656,7 +656,7 @@ Convergence criterion: stop when objective decrease < min_decrease² (default mi - **Negative weights attempted**: Frank-Wolfe operates on the simplex (non-negative, sum-to-1), so weights are always feasible by construction. The step size is clipped to [0, 1] and the move is toward a simplex vertex. - **Perfect pre-treatment fit**: Regularization (ζ² ||ω||²) prevents overfitting by penalizing weight concentration. - **Single treated unit**: Valid; placebo variance uses jackknife-style permutations of controls. -- **Noise level with < 2 pre-periods**: Returns 0.0, which makes both zeta_omega and zeta_lambda equal to 0.0 (no regularization). +- **Noise level with < 2 pre-periods**: Returns 0.0, which makes both zeta_omega and zeta_lambda equal to 0.0 (no regularization). **Note (deviation from R):** `min_decrease` uses a `1e-5` floor when `noise_level == 0` to enable Frank-Wolfe early stopping. R would use `0.0`, causing FW to run all `max_iter` iterations; the result is equivalent since zero-noise data has no variation to optimize. - **NaN inference for undefined statistics**: t_stat uses NaN when SE is zero or non-finite; p_value and CI also NaN. Matches CallawaySantAnna NaN convention. - **Placebo p-value floor**: `p_value = max(empirical_p, 1/(n_replications + 1))` to avoid reporting exactly zero. - **Varying treatment within unit**: Raises `ValueError`. SDID requires block treatment (constant within each unit). Suggests CallawaySantAnna or ImputationDiD for staggered adoption. 
diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py index 75668f37..5db1e6a2 100644 --- a/tests/test_methodology_sdid.py +++ b/tests/test_methodology_sdid.py @@ -893,3 +893,37 @@ def test_good_fit_no_warning(self): assert len(fit_warnings) == 0, ( f"Unexpected pre-treatment fit warning: {fit_warnings[0].message}" ) + + +class TestMinDecreaseFloor: + """Test min_decrease floor when noise_level == 0.""" + + def test_floor_equivalence(self): + """min_decrease=1e-5 floor vs 0.0 gives same weights on zero-noise data.""" + # Build zero-noise collapsed-form matrix (N_co=5, T_pre+1=4) + # All rows identical → noise_level would be 0 + np.random.seed(42) + Y = np.tile(np.array([1.0, 2.0, 3.0, 4.0]), (5, 1)) + + w_floor = _sc_weight_fw(Y, zeta=0.0, intercept=True, + min_decrease=1e-5, max_iter=10000) + w_zero = _sc_weight_fw(Y, zeta=0.0, intercept=True, + min_decrease=0.0, max_iter=10000) + + np.testing.assert_allclose(w_floor, w_zero, atol=1e-10, + err_msg="Floor min_decrease should give same weights as 0.0") + # Both should be valid simplex weights + assert np.all(w_floor >= -1e-12), "Weights should be non-negative" + assert abs(w_floor.sum() - 1.0) < 1e-10, "Weights should sum to 1" + + +class TestEmptyPostGuard: + """Test compute_time_weights guard for empty Y_post_control.""" + + def test_empty_post_raises(self): + """compute_time_weights raises ValueError when Y_post_control has 0 rows.""" + Y_pre = np.random.randn(4, 5) # 4 pre-periods, 5 controls + Y_post = np.empty((0, 5)) # 0 post-periods + + with pytest.raises(ValueError, match="Y_post_control has no rows"): + compute_time_weights(Y_pre, Y_post, zeta_lambda=0.0) From 36ca9a97587baa11abdd560987dfe40a0baf0d2b Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 18:59:38 -0500 Subject: [PATCH 5/9] Deprecate compute_placebo_effects and fix placebo docstring from AI review round 4 Deprecate the legacy compute_placebo_effects utility (uses projected-gradient weights with fixed time 
weights, not matching SDID Algorithm 4). Fix _placebo_variance_se docstring to say "uniform initialization" instead of "original weights as initialization", matching the actual implementation. Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 4 +-- diff_diff/utils.py | 14 ++++++++++ tests/test_utils.py | 53 ++++++++++++++++++++------------------ 3 files changed, 44 insertions(+), 27 deletions(-) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index 02a8db16..9f692db2 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -737,8 +737,8 @@ def _placebo_variance_se( 1. Randomly sample N₀ control indices (permutation) 2. Designate last N₁ as pseudo-treated, first (N₀-N₁) as pseudo-controls - 3. Re-estimate both omega and lambda on the permuted data (using - original weights as initialization), matching R's behavior where + 3. Re-estimate both omega and lambda on the permuted data (from + uniform initialization, fresh start), matching R's behavior where ``update.omega=TRUE, update.lambda=TRUE`` are passed via ``opts`` 4. Compute SDID estimate with re-estimated weights 5. Repeat `replications` times diff --git a/diff_diff/utils.py b/diff_diff/utils.py index 874facb6..7d227c8e 100644 --- a/diff_diff/utils.py +++ b/diff_diff/utils.py @@ -1651,7 +1651,21 @@ def compute_placebo_effects( For each control unit j, we pretend it was treated and compute the SDID estimate using the remaining controls. The distribution of these placebo effects provides a reference for inference. + + .. deprecated:: + This function uses legacy projected-gradient weights and fixed time + weights. Use ``SyntheticDiD(variance_method='placebo')`` instead. """ + warnings.warn( + "compute_placebo_effects uses legacy projected-gradient weights and " + "fixed time weights, which does not match the SDID methodology " + "(Algorithm 4 requires re-estimating both omega and lambda per " + "placebo iteration). 
Use SyntheticDiD(variance_method='placebo') " + "for correct placebo inference. This function will be removed in a " + "future version.", + DeprecationWarning, + stacklevel=2, + ) n_pre, n_control = Y_pre_control.shape if n_placebo is None: diff --git a/tests/test_utils.py b/tests/test_utils.py index 4084ae3b..b536bfa2 100644 --- a/tests/test_utils.py +++ b/tests/test_utils.py @@ -973,14 +973,15 @@ def test_returns_correct_number_of_effects(self, sdid_panel_data): control_units = list(control_pivot.columns) - placebo_effects = compute_placebo_effects( - Y_pre_control, - Y_post_control, - Y_pre_treated, - unit_weights, - time_weights, - control_units - ) + with pytest.warns(DeprecationWarning, match="compute_placebo_effects uses legacy"): + placebo_effects = compute_placebo_effects( + Y_pre_control, + Y_post_control, + Y_pre_treated, + unit_weights, + time_weights, + control_units + ) # Should have one placebo effect per control unit assert len(placebo_effects) == len(control_units) @@ -1005,14 +1006,15 @@ def test_placebo_effects_distribution(self, sdid_panel_data): control_units = list(control_pivot.columns) - placebo_effects = compute_placebo_effects( - Y_pre_control, - Y_post_control, - Y_pre_treated, - unit_weights, - time_weights, - control_units - ) + with pytest.warns(DeprecationWarning, match="compute_placebo_effects uses legacy"): + placebo_effects = compute_placebo_effects( + Y_pre_control, + Y_post_control, + Y_pre_treated, + unit_weights, + time_weights, + control_units + ) # Placebo effects should be centered around zero (no treatment) assert np.abs(np.mean(placebo_effects)) < 2.0 # Allow some deviation @@ -1037,15 +1039,16 @@ def test_n_placebo_limits_output(self, sdid_panel_data): control_units = list(control_pivot.columns) - placebo_effects = compute_placebo_effects( - Y_pre_control, - Y_post_control, - Y_pre_treated, - unit_weights, - time_weights, - control_units, - n_placebo=5 - ) + with pytest.warns(DeprecationWarning, 
match="compute_placebo_effects uses legacy"): + placebo_effects = compute_placebo_effects( + Y_pre_control, + Y_post_control, + Y_pre_treated, + unit_weights, + time_weights, + control_units, + n_placebo=5 + ) assert len(placebo_effects) == 5 From 3e89a1f75ca24969b7833debafc7b9ba263c621f Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 19:18:40 -0500 Subject: [PATCH 6/9] Validate n_bootstrap >= 2 in SyntheticDiD to prevent ZeroDivisionError Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 7 +++++++ tests/test_methodology_sdid.py | 10 ++++++++++ 2 files changed, 17 insertions(+) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index 9f692db2..fdb98740 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -164,6 +164,13 @@ def __init__( self.n_bootstrap = n_bootstrap self.seed = seed + # Validate n_bootstrap + if n_bootstrap < 2: + raise ValueError( + f"n_bootstrap must be >= 2 (got {n_bootstrap}). At least 2 " + f"iterations are needed to estimate standard errors." 
+ ) + # Validate variance_method valid_methods = ("bootstrap", "placebo") if variance_method not in valid_methods: diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py index 5db1e6a2..2723e228 100644 --- a/tests/test_methodology_sdid.py +++ b/tests/test_methodology_sdid.py @@ -470,6 +470,16 @@ def test_bootstrap_se_positive(self, ci_params): class TestEdgeCases: """Edge case handling.""" + def test_n_bootstrap_validation(self): + """n_bootstrap < 2 should raise ValueError.""" + with pytest.raises(ValueError, match="n_bootstrap must be >= 2"): + SyntheticDiD(n_bootstrap=0) + with pytest.raises(ValueError, match="n_bootstrap must be >= 2"): + SyntheticDiD(n_bootstrap=1) + # n_bootstrap=2 should be accepted + sdid = SyntheticDiD(n_bootstrap=2) + assert sdid.n_bootstrap == 2 + def test_single_treated_unit(self, ci_params): """Estimation should work with a single treated unit.""" df = _make_panel(n_control=10, n_treated=1, n_pre=5, n_post=2, From ee5a1e46be84101b5f4b1c1e75f7510f3478e93f Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 20:32:24 -0500 Subject: [PATCH 7/9] Filter non-finite tau in Python SDID paths and gate inference on finite SE MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Add np.isfinite(tau) guard in Python bootstrap and placebo loops to match Rust backend's tau.is_finite() filtering (sdid_variance.rs:220,391) - Change `se > 0` to `np.isfinite(se) and se > 0` so se=inf produces NaN inference fields instead of misleading t_stat≈0 and spurious p-values - Add regression tests for non-finite tau filtering and inf SE gating Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 10 ++-- tests/test_methodology_sdid.py | 96 ++++++++++++++++++++++++++++++++++ 2 files changed, 102 insertions(+), 4 deletions(-) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index fdb98740..2945949e 100644 --- a/diff_diff/synthetic_did.py +++ 
b/diff_diff/synthetic_did.py @@ -424,7 +424,7 @@ def fit( # type: ignore[override] inference_method = "placebo" # Compute test statistics - if se > 0: + if np.isfinite(se) and se > 0: t_stat = att / se # Use placebo distribution for p-value if available if len(placebo_effects) > 0: @@ -438,7 +438,7 @@ def fit( # type: ignore[override] p_value = np.nan # Confidence interval - if se > 0: + if np.isfinite(se) and se > 0: conf_int = compute_confidence_interval(att, se, self.alpha) else: conf_int = (np.nan, np.nan) @@ -676,7 +676,8 @@ def _bootstrap_se( Y_boot_pre_t_mean, Y_boot_post_t_mean, boot_omega, time_weights # time_weights = original lambda ) - bootstrap_estimates.append(tau) + if np.isfinite(tau): + bootstrap_estimates.append(tau) except (ValueError, LinAlgError): continue @@ -899,7 +900,8 @@ def _placebo_variance_se( pseudo_omega, pseudo_lambda ) - placebo_estimates.append(tau) + if np.isfinite(tau): + placebo_estimates.append(tau) except (ValueError, LinAlgError, ZeroDivisionError): # Skip failed iterations diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py index 2723e228..ee544cc6 100644 --- a/tests/test_methodology_sdid.py +++ b/tests/test_methodology_sdid.py @@ -7,6 +7,7 @@ """ import warnings +from unittest.mock import patch import numpy as np import pytest @@ -530,6 +531,101 @@ def test_se_zero_propagation(self): assert np.isnan(results.conf_int[0]) assert np.isnan(results.conf_int[1]) + def test_nonfinite_tau_filtered_in_bootstrap(self): + """Non-finite tau values are filtered in Python bootstrap path (matches Rust).""" + call_count = [0] + + def mock_estimator(*args, **kwargs): + call_count[0] += 1 + if call_count[0] % 3 == 0: + return np.inf + return 1.0 + call_count[0] * 0.01 + + rng = np.random.default_rng(42) + n_pre, n_post, n_control, n_treated = 5, 2, 10, 3 + Y_pre_c = rng.normal(size=(n_pre, n_control)) + Y_post_c = rng.normal(size=(n_post, n_control)) + Y_pre_t = rng.normal(size=(n_pre, n_treated)) + Y_post_t = 
rng.normal(size=(n_post, n_treated)) + unit_weights = np.ones(n_control) / n_control + time_weights = np.ones(n_pre) / n_pre + + sdid = SyntheticDiD(n_bootstrap=20, seed=42) + + with patch('diff_diff.synthetic_did.compute_sdid_estimator', + side_effect=mock_estimator), \ + patch('diff_diff._backend.HAS_RUST_BACKEND', False): + se, estimates = sdid._bootstrap_se( + Y_pre_c, Y_post_c, Y_pre_t, Y_post_t, + unit_weights, time_weights, + ) + + # All retained estimates must be finite (non-finite filtered out) + assert np.all(np.isfinite(estimates)), "Non-finite tau leaked into bootstrap estimates" + # Some estimates should have been filtered (every 3rd call returns inf) + assert len(estimates) < 20 + + def test_nonfinite_tau_filtered_in_placebo(self): + """Non-finite tau values are filtered in Python placebo path (matches Rust).""" + call_count = [0] + + def mock_estimator(*args, **kwargs): + call_count[0] += 1 + if call_count[0] % 3 == 0: + return np.nan + return 2.0 + call_count[0] * 0.01 + + rng = np.random.default_rng(42) + n_pre, n_post, n_control, n_treated = 5, 2, 15, 3 + Y_pre_c = rng.normal(size=(n_pre, n_control)) + Y_post_c = rng.normal(size=(n_post, n_control)) + Y_pre_t_mean = rng.normal(size=(n_pre,)) + Y_post_t_mean = rng.normal(size=(n_post,)) + unit_weights = np.ones(n_control) / n_control + time_weights = np.ones(n_pre) / n_pre + + sdid = SyntheticDiD(seed=42) + + with patch('diff_diff.synthetic_did.compute_sdid_estimator', + side_effect=mock_estimator), \ + patch('diff_diff.synthetic_did.compute_sdid_unit_weights', + return_value=np.ones(n_control - n_treated) / (n_control - n_treated)), \ + patch('diff_diff.synthetic_did.compute_time_weights', + return_value=np.ones(n_pre) / n_pre), \ + patch('diff_diff._backend.HAS_RUST_BACKEND', False): + se, estimates = sdid._placebo_variance_se( + Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, + unit_weights, time_weights, + n_treated=n_treated, + replications=20, + ) + + # All retained estimates must be finite 
(non-finite filtered out) + assert np.all(np.isfinite(estimates)), "Non-finite tau leaked into placebo estimates" + # Some estimates should have been filtered (every 3rd call returns nan) + assert len(estimates) < 20 + + def test_inf_se_produces_nan_inference(self): + """SE=inf should produce NaN t_stat, p_value, and CI.""" + df = _make_panel(n_control=10, n_treated=3, n_pre=5, n_post=2, seed=42) + sdid = SyntheticDiD(variance_method="bootstrap", n_bootstrap=10, seed=42) + + with patch.object( + SyntheticDiD, '_bootstrap_se', + return_value=(np.inf, np.array([1.0, 2.0, 3.0])), + ): + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=[5, 6], + ) + + assert results.se == np.inf + assert np.isnan(results.t_stat) + assert np.isnan(results.p_value) + assert np.isnan(results.conf_int[0]) + assert np.isnan(results.conf_int[1]) + # ============================================================================= # get_params / set_params From 5da0999dca0553d777bd60b8b2c420e27918a8c3 Mon Sep 17 00:00:00 2001 From: igerber Date: Tue, 10 Feb 2026 20:51:21 -0500 Subject: [PATCH 8/9] Update SDID docs: replace deprecated lambda_reg and invalid n_bootstrap=0 Troubleshooting docs now use zeta_omega/zeta_lambda instead of deprecated lambda_reg, and variance_method="placebo" instead of invalid n_bootstrap=0. API autosummary removes lambda_reg and adds missing diagnostic fields. 
Co-Authored-By: Claude Opus 4.6 --- docs/api/_autosummary/diff_diff.SyntheticDiDResults.rst | 6 +++++- docs/troubleshooting.rst | 6 +++--- 2 files changed, 8 insertions(+), 4 deletions(-) diff --git a/docs/api/_autosummary/diff_diff.SyntheticDiDResults.rst b/docs/api/_autosummary/diff_diff.SyntheticDiDResults.rst index 6e98446e..ef74b204 100644 --- a/docs/api/_autosummary/diff_diff.SyntheticDiDResults.rst +++ b/docs/api/_autosummary/diff_diff.SyntheticDiDResults.rst @@ -31,7 +31,6 @@ ~SyntheticDiDResults.alpha ~SyntheticDiDResults.is_significant - ~SyntheticDiDResults.lambda_reg ~SyntheticDiDResults.placebo_effects ~SyntheticDiDResults.pre_treatment_fit ~SyntheticDiDResults.significance_stars @@ -47,5 +46,10 @@ ~SyntheticDiDResults.time_weights ~SyntheticDiDResults.pre_periods ~SyntheticDiDResults.post_periods + ~SyntheticDiDResults.variance_method + ~SyntheticDiDResults.noise_level + ~SyntheticDiDResults.zeta_omega + ~SyntheticDiDResults.zeta_lambda + ~SyntheticDiDResults.n_bootstrap \ No newline at end of file diff --git a/docs/troubleshooting.rst b/docs/troubleshooting.rst index 19b86b93..d8aff499 100644 --- a/docs/troubleshooting.rst +++ b/docs/troubleshooting.rst @@ -84,7 +84,7 @@ Estimation Errors # Or use fewer fixed effects # For SyntheticDiD, increase regularization - sdid = SyntheticDiD(lambda_reg=1e-4) # default is 1e-6 + sdid = SyntheticDiD(zeta_omega=1e-4) # increase unit weight regularization "Bootstrap iterations failed" warning ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ @@ -102,10 +102,10 @@ Estimation Errors .. 
code-block:: python # Increase regularization - sdid = SyntheticDiD(lambda_reg=1e-4, n_bootstrap=500) + sdid = SyntheticDiD(zeta_omega=1e-4, zeta_lambda=1e-4, n_bootstrap=500) # Or use placebo-based inference instead - sdid = SyntheticDiD(n_bootstrap=0) # Uses placebo inference + sdid = SyntheticDiD(variance_method="placebo") # Uses placebo inference # Ensure sufficient pre-treatment periods (recommend >= 4) From e481aed1bcd377a2c8558aa3c4e4b0f0a3f8a670 Mon Sep 17 00:00:00 2001 From: igerber Date: Wed, 11 Feb 2026 06:31:42 -0500 Subject: [PATCH 9/9] Add bootstrap zeta-override test and remove unused placebo params - Add test_bootstrap_with_zeta_overrides to cover bootstrap SE path with user-specified zeta_omega/zeta_lambda overrides (P1 coverage gap) - Remove unused unit_weights/time_weights params from _placebo_variance_se signature, docstring, and call site (P3 cleanup) - Update existing test that called _placebo_variance_se directly Co-Authored-By: Claude Opus 4.6 --- diff_diff/synthetic_did.py | 8 -------- tests/test_methodology_sdid.py | 22 +++++++++++++++++++--- 2 files changed, 19 insertions(+), 11 deletions(-) diff --git a/diff_diff/synthetic_did.py b/diff_diff/synthetic_did.py index 2945949e..47f01438 100644 --- a/diff_diff/synthetic_did.py +++ b/diff_diff/synthetic_did.py @@ -413,8 +413,6 @@ def fit( # type: ignore[override] Y_post_control, Y_pre_treated_mean, Y_post_treated_mean, - unit_weights, - time_weights, n_treated=len(treated_units), zeta_omega=zeta_omega, zeta_lambda=zeta_lambda, @@ -729,8 +727,6 @@ def _placebo_variance_se( Y_post_control: np.ndarray, Y_pre_treated_mean: np.ndarray, Y_post_treated_mean: np.ndarray, - unit_weights: np.ndarray, - time_weights: np.ndarray, n_treated: int, zeta_omega: float = 0.0, zeta_lambda: float = 0.0, @@ -762,10 +758,6 @@ def _placebo_variance_se( Mean treated outcomes in pre-treatment periods, shape (n_pre,). Y_post_treated_mean : np.ndarray Mean treated outcomes in post-treatment periods, shape (n_post,). 
- unit_weights : np.ndarray - Original unit weights from main estimation, shape (n_control,). - time_weights : np.ndarray - Time weights from main estimation, shape (n_pre,). n_treated : int Number of treated units in the original estimation. zeta_omega : float diff --git a/tests/test_methodology_sdid.py b/tests/test_methodology_sdid.py index ee544cc6..3eb86645 100644 --- a/tests/test_methodology_sdid.py +++ b/tests/test_methodology_sdid.py @@ -462,6 +462,25 @@ def test_bootstrap_se_positive(self, ci_params): assert results.se > 0 assert results.variance_method == "bootstrap" + def test_bootstrap_with_zeta_overrides(self, ci_params): + """Bootstrap SE should work with user-specified zeta overrides.""" + df = _make_panel(n_control=20, n_treated=3, seed=42) + n_boot = ci_params.bootstrap(50) + sdid = SyntheticDiD( + variance_method="bootstrap", n_bootstrap=n_boot, + zeta_omega=99.0, zeta_lambda=0.5, seed=42, + ) + results = sdid.fit( + df, outcome="outcome", treatment="treated", + unit="unit", time="period", + post_periods=list(range(5, 8)), + ) + + assert results.zeta_omega == 99.0 + assert results.zeta_lambda == 0.5 + assert results.variance_method == "bootstrap" + assert results.se > 0 + # ============================================================================= # Edge Cases @@ -581,8 +600,6 @@ def mock_estimator(*args, **kwargs): Y_post_c = rng.normal(size=(n_post, n_control)) Y_pre_t_mean = rng.normal(size=(n_pre,)) Y_post_t_mean = rng.normal(size=(n_post,)) - unit_weights = np.ones(n_control) / n_control - time_weights = np.ones(n_pre) / n_pre sdid = SyntheticDiD(seed=42) @@ -595,7 +612,6 @@ def mock_estimator(*args, **kwargs): patch('diff_diff._backend.HAS_RUST_BACKEND', False): se, estimates = sdid._placebo_variance_se( Y_pre_c, Y_post_c, Y_pre_t_mean, Y_post_t_mean, - unit_weights, time_weights, n_treated=n_treated, replications=20, )