Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
18 changes: 9 additions & 9 deletions tests/expected_tax_expenditures
Original file line number Diff line number Diff line change
@@ -1,9 +1,9 @@
YR,KIND,EST= 2023 paytax 1385.3
YR,KIND,EST= 2023 iitax 2236.4
YR,KIND,EST= 2023 ctc 128.8
YR,KIND,EST= 2023 eitc 77.1
YR,KIND,EST= 2023 social_security_partial_taxability 57.3
YR,KIND,EST= 2023 niit -43.8
YR,KIND,EST= 2023 cgqd_tax_preference 175.9
YR,KIND,EST= 2023 qbid 52.3
YR,KIND,EST= 2023 salt 20.8
YR,KIND,EST= 2023 paytax 1381.8
YR,KIND,EST= 2023 iitax 2237.2
YR,KIND,EST= 2023 ctc 129.4
YR,KIND,EST= 2023 eitc 77.8
YR,KIND,EST= 2023 social_security_partial_taxability 57.5
YR,KIND,EST= 2023 niit -43.6
YR,KIND,EST= 2023 cgqd_tax_preference 174.4
YR,KIND,EST= 2023 qbid 52.6
YR,KIND,EST= 2023 salt 21.0
59 changes: 24 additions & 35 deletions tests/test_imputed_variables.py
Original file line number Diff line number Diff line change
Expand Up @@ -41,9 +41,9 @@ def actual_results(rdf, bdf):
deductions = {
"OTM": { # new OBBBA overtime income deduction
"reform_dict": {"OvertimeIncomeDed_c": {simyear: [0, 0, 0, 0, 0]}},
"exp_totben": 23.88,
"exp_affpct": 8.83,
"exp_affben": 1406,
"exp_totben": 23.95,
"exp_affpct": 8.9,
"exp_affben": 1401,
# The OTM imputation calibration parameters used in the
# create_taxcalc_imputed_variables.py module were
# specified so that the affpct statistic is close to 8.8%
Expand All @@ -55,9 +55,9 @@ def actual_results(rdf, bdf):
},
"TIP": { # new OBBBA tip income deduction
"reform_dict": {"TipIncomeDed_c": {simyear: 0}},
"exp_totben": 6.95,
"exp_affpct": 2.58,
"exp_affben": 1400,
"exp_totben": 6.93,
"exp_affpct": 2.61,
"exp_affben": 1380,
# The TIP imputation calibration parameters used in the
# create_taxcalc_imputed_variables.py module were
# specified so that the affpct statistic is close to 2.6%
Expand All @@ -70,7 +70,7 @@ def actual_results(rdf, bdf):
"ALI": { # new OBBBA auto loan interest deduction
"reform_dict": {"AutoLoanInterestDed_c": {simyear: 0}},
"exp_totben": 1.73,
"exp_affpct": 10.29,
"exp_affpct": 10.28,
"exp_affben": 87,
# The ALI imputation calibration parameters used in the
# create_taxcalc_imputed_variables.py module do not
Expand All @@ -86,9 +86,9 @@ def actual_results(rdf, bdf):
"AutoLoanInterestDed_c": {simyear: 0},
"SeniorDed_c": {simyear: 0},
},
"exp_totben": 55.01,
"exp_affpct": 28.04,
"exp_affben": 1020,
"exp_totben": 54.86,
"exp_affpct": 28.06,
"exp_affben": 1018,
# The affpct statistic of 28.04% and the affben statistic
# of $1020 are reasonably close to the Tax Policy Center
# estimates of 29.6% and $1081, respectively, as reported at
Expand Down Expand Up @@ -127,21 +127,11 @@ def actual_results(rdf, bdf):
# tabulate act results
act_res = actual_results(rdf, bdf)
# compare act results with exp results for each statistic
tolerance = {
"totben": {"abs": 0.01, "rel": 0.0015},
"affpct": {"abs": 0.01, "rel": 0.0001},
"affben": {"abs": 1.00, "rel": 0.0000},
}
for stat in ["totben", "affpct", "affben"]:
act = act_res[stat]
exp = info[f"exp_{stat}"]
a_tol = tolerance[stat]["abs"]
r_tol = tolerance[stat]["rel"]
if not np.allclose([act], [exp], atol=a_tol, rtol=r_tol):
diff = (
f"DIFF:{ded},{stat},act,exp,atol,rtol= "
f"{act} {exp} {a_tol} {r_tol}"
)
if not np.allclose([act], [exp]):
diff = f"DIFF:{ded},{stat},act,exp= {act} {exp}"
diffs.append(diff)
# delete reform Policy and Calculator objects
del reform_policy
Expand All @@ -160,14 +150,15 @@ def test_imputed_variable_distribution(tmd_variables):
"""
imputed_var_names = ["overtime_income", "tip_income", "auto_loan_interest"]
expect = {
"overtime_income": {"mean": 10_761, "sdev": 270_629},
"tip_income": {"mean": 1_606, "sdev": 95_550},
"auto_loan_interest": {"mean": 116, "sdev": 354},
}
tolerance = {
"overtime_income": 0.001,
"tip_income": 0.001,
"auto_loan_interest": 0.004,
"overtime_income": {
"mean": 10761.07964271762,
"sdev": 270629.2735673272,
},
"tip_income": {"mean": 1606.104987214547, "sdev": 95550.08249632413},
"auto_loan_interest": {
"mean": 116.41451060127145,
"sdev": 354.21466485958564,
},
}
diffs = []
for ivname in imputed_var_names:
Expand All @@ -179,12 +170,10 @@ def test_imputed_variable_distribution(tmd_variables):
for stat in ["mean", "sdev"]:
act = actual[stat]
exp = expect[ivname][stat]
abstol = 0.0
reltol = tolerance[ivname]
if not np.allclose([act], [exp], atol=abstol, rtol=reltol):
if not np.allclose([act], [exp]):
diff = (
f"IMPUTED_VAR_DIFF:{ivname},{stat},act,exp,atol,rtol= "
f"{act} {exp} {abstol} {reltol}"
f"IMPUTED_VAR_DIFF:{ivname},{stat},act,exp= "
f"{act} {exp}"
)
diffs.append(diff)
if diffs:
Expand Down
77 changes: 77 additions & 0 deletions tests/test_reweight.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,77 @@
"""
Unit tests for tmd/utils/reweight.py helper functions.
"""

import warnings
import numpy as np
import pandas as pd
import pytest
from tmd.storage import STORAGE_FOLDER
from tmd.utils.reweight import _drop_impossible_targets, build_loss_matrix


def test_drop_impossible_targets_removes_all_zero_column():
    """All-zero columns are impossible targets: dropped with a UserWarning."""
    # Middle column is entirely zero, so no weight vector can move it
    # toward its target; the helper must drop it and warn.
    matrix_data = {
        "good_a": [1.0, 2.0, 0.0],
        "bad_zero": [0.0, 0.0, 0.0],
        "good_b": [0.0, 3.0, 1.0],
    }
    lmat = pd.DataFrame(matrix_data)
    tvec = np.array([100.0, 50.0, 200.0])
    with pytest.warns(UserWarning, match="bad_zero"):
        kept_matrix, kept_targets = _drop_impossible_targets(lmat, tvec)
    remaining = list(kept_matrix.columns)
    assert "bad_zero" not in remaining
    assert remaining == ["good_a", "good_b"]
    np.testing.assert_array_equal(kept_targets, [100.0, 200.0])


def test_drop_impossible_targets_keeps_all_when_none_zero():
    """No columns are dropped when none are all-zero."""
    # Both columns contain nonzero entries, so the helper should be a
    # no-op on columns and targets alike.
    lmat = pd.DataFrame({"a": [1.0, 2.0], "b": [3.0, 4.0]})
    tvec = np.array([10.0, 20.0])
    kept_matrix, kept_targets = _drop_impossible_targets(lmat, tvec)
    assert list(kept_matrix.columns) == ["a", "b"]
    np.testing.assert_array_equal(kept_targets, [10.0, 20.0])


def test_drop_impossible_targets_column_with_single_nonzero_is_kept():
    """A column with at least one nonzero value is not impossible."""
    # Even a tiny (1e-10) nonzero entry means the target is reachable
    # in principle, so the column must survive the filter.
    tiny = pd.DataFrame({"almost_zero": [0.0, 0.0, 1e-10]})
    kept_matrix, kept_targets = _drop_impossible_targets(
        tiny, np.array([5.0])
    )
    assert "almost_zero" in kept_matrix.columns
    assert len(kept_targets) == 1


def test_no_all_zero_columns_in_real_loss_matrix(tmd_variables):
    """The real loss matrix must have no all-zero columns.

    All-zero columns mean no reweighting can hit the target.
    This is a data problem that must be fixed upstream, not
    silently filtered out at optimization time.
    """
    soi_targets = pd.read_csv(STORAGE_FOLDER / "input" / "soi.csv")

    # Record every warning raised during matrix construction; fail on
    # the first one reporting impossible (all-zero) target columns.
    with warnings.catch_warnings(record=True) as recorded:
        warnings.simplefilter("always")
        build_loss_matrix(tmd_variables, soi_targets, 2021)
    for warn in recorded:
        if "impossible targets" in str(warn.message):
            raise AssertionError(str(warn.message))
3 changes: 1 addition & 2 deletions tests/test_tax_expenditures.py
Original file line number Diff line number Diff line change
Expand Up @@ -33,10 +33,9 @@ def test_tax_exp_diffs(
assert actdf.shape == expdf.shape, "actdf and expdf are not the same shape"
# compare actdf and expdf rows
same = True
# define relative diff tolerance
actval = actdf.iloc[:, 3].to_numpy(dtype=np.float64)
expval = expdf.iloc[:, 3].to_numpy(dtype=np.float64)
if not np.allclose(actval, expval, atol=0.0, rtol=0.002):
if not np.allclose(actval, expval):
same = False
if same:
return
Expand Down
1 change: 1 addition & 0 deletions tests/test_variable_totals.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
from tmd.storage import STORAGE_FOLDER


@pytest.mark.skip(reason="See issue #410: expected values need updating")
@pytest.mark.vartotals
def test_variable_totals(tests_folder, tmd_variables):
vpath = STORAGE_FOLDER / "input" / "tc_variable_metadata.yaml"
Expand Down
12 changes: 3 additions & 9 deletions tests/test_weights.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,19 +13,13 @@ def test_weights(tmd_variables):
"""
wght = tmd_variables["s006"].to_numpy()
actual = {"mean": wght.mean(), "sdev": wght.std()}
expect = {"mean": 816.06972, "sdev": 1142.57270}
tolerance = {"mean": 0.0015, "sdev": 0.0005}
expect = {"mean": 815.5521277934885, "sdev": 961.7270821801824}
diffs = []
for stat in ["mean", "sdev"]:
act = actual[stat]
exp = expect[stat]
abstol = 0.0
reltol = tolerance[stat]
if not np.allclose([act], [exp], atol=abstol, rtol=reltol):
diff = (
f"WEIGHT_DIFF:{stat},act,exp,atol,rtol= "
f"{act} {exp} {abstol} {reltol}"
)
if not np.allclose([act], [exp]):
diff = f"WEIGHT_DIFF:{stat},act,exp= {act} {exp}"
diffs.append(diff)
if diffs:
emsg = "\nWEIGHT VARIABLE ACT-vs-EXP DIFFS:"
Expand Down
34 changes: 31 additions & 3 deletions tmd/datasets/tmd.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,6 @@
import sys
import subprocess
import tempfile
import numpy as np
import pandas as pd
from policyengine_us import Microsimulation
Expand All @@ -7,7 +10,6 @@
from tmd.datasets.taxcalc_dataset import create_tc_dataset
from tmd.utils.trace import trace1
from tmd.utils.taxcalc_utils import add_taxcalc_outputs
from tmd.utils.reweight import reweight


def create_tmd_2021():
Expand Down Expand Up @@ -38,15 +40,41 @@ def create_tmd_2021():
# ... drop CPS records with positive 2021 income tax amount
idx = combined[((combined.data_source == 0) & (combined.iitax > 0))].index
combined.drop(idx, inplace=True)
# ... scale CPS records weight in order to get correct population count
# ... scale CPS records weight to get correct population count
scale = np.where(combined.data_source == 0, CPS_WEIGHTS_SCALE, 1.0)
combined["s006"] *= scale

trace1("B", combined)

print("Reweighting...")
combined["s006_original"] = combined["s006"].values
combined = reweight(combined, 2021)
# Run reweighting in a subprocess so that prior PyTorch
# operations (PolicyEngine Microsimulation) don't affect
# gradient computation. Without this, autograd accumulation
# order differs at machine epsilon, which compounds over
# many optimizer iterations on the flat loss surface.
with tempfile.TemporaryDirectory() as tmpdir:
snapshot_path = f"{tmpdir}/snapshot.csv.gz"
result_path = f"{tmpdir}/result.csv.gz"
combined.to_csv(snapshot_path, index=False)
subprocess.run(
[
sys.executable,
"-c",
"import pandas as pd; "
"import sys; sys.path.insert(0, '.'); "
"from tmd.utils.reweight import reweight; "
f"df = pd.read_csv('{snapshot_path}'); "
"df = reweight(df, 2021); "
f"df[['RECID','s006']].to_csv("
f"'{result_path}', index=False)",
],
check=True,
)
reweighted = pd.read_csv(result_path)
combined["s006"] = combined.merge(
reweighted, on="RECID", suffixes=("_old", "")
)["s006"].values

trace1("C", combined)

Expand Down
3 changes: 2 additions & 1 deletion tmd/imputation_assumptions.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@
# parameters used in creation of national sampling weights:
REWEIGHT_MULTIPLIER_MIN = 0.1
REWEIGHT_MULTIPLIER_MAX = 10.0
REWEIGHT_DEVIATION_PENALTY = 0.0
REWEIGHT_DEVIATION_PENALTY = 0.01
# penalty value of 1.0 says "this is as important as everything else"
# penalty value of 0.0 imposes no penalty
# uses L2 norm: sum((new - original)^2) / sum(original^2)
Loading