From 3f6e0b93076c4ddf60671639864770ef1841852b Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Thu, 26 Feb 2026 15:00:43 -0500
Subject: [PATCH 01/12] Add South Carolina dataset exploration

Adds data exploration notebook and summary CSV for South Carolina (SC) dataset:
- Household and person counts (weighted)
- AGI distribution (median, average, percentiles) at household and person level
- Households with children breakdown
- Children by age group demographics
- Income bracket analysis

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/data_exploration.ipynb          | 290 +++++++++++++++++++
 us/states/sc/sc_dataset_summary_weighted.csv |  22 ++
 2 files changed, 312 insertions(+)
 create mode 100644 us/states/sc/data_exploration.ipynb
 create mode 100644 us/states/sc/sc_dataset_summary_weighted.csv

diff --git a/us/states/sc/data_exploration.ipynb b/us/states/sc/data_exploration.ipynb
new file mode 100644
index 0000000..09787fd
--- /dev/null
+++ b/us/states/sc/data_exploration.ipynb
@@ -0,0 +1,290 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# SC Dataset Exploration\n",
+    "\n",
+    "This notebook explores the South Carolina (SC) dataset to understand household counts, income distribution, and demographic characteristics."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/policyengine-us-data/states/SC.h5\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Load SC dataset\n",
+    "sim = Microsimulation(dataset=SC_DATASET)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Number of households in dataset: 35,324\n",
+      "Household count (weighted): 1,887,388\n",
+      "Person count (weighted): 5,451,832\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check dataset size\n",
+    "household_weight = sim.calculate(\"household_weight\", period=2025)\n",
+    "household_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\")\n",
+    "person_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\")\n",
+    "\n",
+    "print(f\"Number of households in dataset: {len(household_weight):,}\")\n",
+    "print(f\"Household count (weighted): {household_count.sum():,.0f}\")\n",
+    "print(f\"Person count (weighted): {person_count.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": "# Check income distribution (weighted vs unweighted, household and person level)\nagi_household = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\")\nagi_hh_array = np.array(agi_household)\nhh_weights = np.array(sim.calculate(\"household_weight\", period=2025))\n\nagi_person = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\")\nagi_person_array = np.array(agi_person)\nperson_weights = np.array(sim.calculate(\"person_weight\", period=2025))\n\n# Weighted percentile calculation\ndef weighted_percentile(values, weights, percentile):\n    sorted_indices = np.argsort(values)\n    sorted_values = values[sorted_indices]\n    sorted_weights = weights[sorted_indices]\n    cumulative_weight = np.cumsum(sorted_weights)\n    idx = np.searchsorted(cumulative_weight, cumulative_weight[-1] * percentile / 100)\n    return sorted_values[min(idx, len(sorted_values)-1)]\n\n# Unweighted medians\nunweighted_median_hh = np.median(agi_hh_array)\nunweighted_median_person = np.median(agi_person_array)\n\n# Weighted medians\nweighted_median_hh = weighted_percentile(agi_hh_array, hh_weights, 50)\nweighted_median_person = weighted_percentile(agi_person_array, person_weights, 50)\n\n# Weighted averages\nweighted_avg_hh = np.average(agi_hh_array, weights=hh_weights)\nweighted_avg_person = np.average(agi_person_array, weights=person_weights)\n\n# Average household size\ntotal_persons = person_weights.sum()\ntotal_households = hh_weights.sum()\navg_hh_size = total_persons / total_households\n\nprint(\"=\" * 60)\nprint(\"INCOME DISTRIBUTION SUMMARY\")\nprint(\"=\" * 60)\nprint(f\"\\nHousehold AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_hh:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_hh:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_hh:,.0f}\")\n\nprint(f\"\\nPerson AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_person:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_person:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_person:,.0f}\")\n\nprint(f\"\\nAverage household size: {avg_hh_size:.1f}\")\n\nprint(f\"\\nWeighted household AGI percentiles:\")\nprint(f\"  25th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\")\nprint(f\"  50th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 50):,.0f}\")\nprint(f\"  75th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\")\nprint(f\"  90th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\")\nprint(f\"  95th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\")\nprint(f\"  Max AGI: ${agi_hh_array.max():,.0f}\")"
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Households with children (weighted):\n",
+      "  Total households with children: 598,564\n",
+      "  Households with 1 child: 247,956\n",
+      "  Households with 2 children: 190,545\n",
+      "  Households with 3+ children: 160,063\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check households with children\n",
+    "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\")\n",
+    "household_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\")\n",
+    "household_weight = sim.calculate(\"household_weight\", period=2025, map_to=\"person\")\n",
+    "\n",
+    "# Create DataFrame\n",
+    "df_households = pd.DataFrame({\n",
+    "    'household_id': household_id,\n",
+    "    'is_child': is_child,\n",
+    "    'household_weight': household_weight\n",
+    "})\n",
+    "\n",
+    "# Count children per household\n",
+    "children_per_household = df_households.groupby('household_id').agg({\n",
+    "    'is_child': 'sum',\n",
+    "    'household_weight': 'first'\n",
+    "}).reset_index()\n",
+    "\n",
+    "# Calculate weighted household counts\n",
+    "total_households_with_children = children_per_household[children_per_household['is_child'] > 0]['household_weight'].sum()\n",
+    "households_with_1_child = children_per_household[children_per_household['is_child'] == 1]['household_weight'].sum()\n",
+    "households_with_2_children = children_per_household[children_per_household['is_child'] == 2]['household_weight'].sum()\n",
+    "households_with_3plus_children = children_per_household[children_per_household['is_child'] >= 3]['household_weight'].sum()\n",
+    "\n",
+    "print(f\"\\nHouseholds with children (weighted):\")\n",
+    "print(f\"  Total households with children: {total_households_with_children:,.0f}\")\n",
+    "print(f\"  Households with 1 child: {households_with_1_child:,.0f}\")\n",
+    "print(f\"  Households with 2 children: {households_with_2_children:,.0f}\")\n",
+    "print(f\"  Households with 3+ children: {households_with_3plus_children:,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Children by age:\n",
+      "  Total children under 18: 1,198,147\n",
+      "  Children under 6: 349,101\n",
+      "  Children under 3: 169,412\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check children by age groups\n",
+    "df = pd.DataFrame({\n",
+    "    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\"),\n",
+    "    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\"),\n",
+    "    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\"),\n",
+    "    \"age\": sim.calculate(\"age\", map_to=\"person\"),\n",
+    "    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\")\n",
+    "})\n",
+    "\n",
+    "# Filter for children and apply weights\n",
+    "children_under_18_df = df[df['age'] < 18]\n",
+    "children_under_6_df = df[df['age'] < 6]\n",
+    "children_under_3_df = df[df['age'] < 3]\n",
+    "\n",
+    "# Calculate weighted totals\n",
+    "total_children = children_under_18_df['person_weight'].sum()\n",
+    "children_under_6 = children_under_6_df['person_weight'].sum()\n",
+    "children_under_3 = children_under_3_df['person_weight'].sum()\n",
+    "\n",
+    "print(f\"\\nChildren by age:\")\n",
+    "print(f\"  Total children under 18: {total_children:,.0f}\")\n",
+    "print(f\"  Children under 6: {children_under_6:,.0f}\")\n",
+    "print(f\"  Children under 3: {children_under_3:,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": "# Create comprehensive summary table\nsummary_data = {\n    'Metric': [\n        'Household count (weighted)',\n        'Person count (weighted)',\n        'Average household size',\n        'Weighted median household AGI',\n        'Weighted average household AGI',\n        'Weighted median person AGI',\n        'Weighted average person AGI',\n        'Unweighted median household AGI',\n        'Unweighted median person AGI',\n        '25th percentile household AGI',\n        '75th percentile household AGI',\n        '90th percentile household AGI',\n        '95th percentile household AGI',\n        'Max household AGI',\n        'Total households with children',\n        'Households with 1 child',\n        'Households with 2 children',\n        'Households with 3+ children',\n        'Total children under 18',\n        'Children under 6',\n        'Children under 3'\n    ],\n    'Value': [\n        f\"{household_count.sum():,.0f}\",\n        f\"{person_count.sum():,.0f}\",\n        f\"{avg_hh_size:.1f}\",\n        f\"${weighted_median_hh:,.0f}\",\n        f\"${weighted_avg_hh:,.0f}\",\n        f\"${weighted_median_person:,.0f}\",\n        f\"${weighted_avg_person:,.0f}\",\n        f\"${unweighted_median_hh:,.0f}\",\n        f\"${unweighted_median_person:,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\",\n        f\"${agi_hh_array.max():,.0f}\",\n        f\"{total_households_with_children:,.0f}\",\n        f\"{households_with_1_child:,.0f}\",\n        f\"{households_with_2_children:,.0f}\",\n        f\"{households_with_3plus_children:,.0f}\",\n        f\"{total_children:,.0f}\",\n        f\"{children_under_6:,.0f}\",\n        f\"{children_under_3:,.0f}\"\n    ]\n}\n\nsummary_df = pd.DataFrame(summary_data)\n\nprint(\"\\n\" + \"=\"*65)\nprint(\"SC DATASET SUMMARY - WEIGHTED (Population Estimates)\")\nprint(\"=\"*65)\nprint(summary_df.to_string(index=False))\nprint(\"=\"*65)\n\n# Save table\nsummary_df.to_csv('sc_dataset_summary_weighted.csv', index=False)\nprint(\"\\nSummary saved to: sc_dataset_summary_weighted.csv\")"
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLDS WITH $0 INCOME\n",
+      "======================================================================\n",
+      "Household count: 179,119\n",
+      "Percentage of all households: 9.49%\n",
+      "======================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Households with $0 income\n",
+    "agi_hh = np.array(sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\"))\n",
+    "weights = np.array(sim.calculate(\"household_weight\", period=2025))\n",
+    "\n",
+    "zero_income_mask = agi_hh == 0\n",
+    "zero_income_count = weights[zero_income_mask].sum()\n",
+    "total_households = weights.sum()\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*70)\n",
+    "print(\"HOUSEHOLDS WITH $0 INCOME\")\n",
+    "print(\"=\"*70)\n",
+    "print(f\"Household count: {zero_income_count:,.0f}\")\n",
+    "print(f\"Percentage of all households: {zero_income_count / total_households * 100:.2f}%\")\n",
+    "print(\"=\"*70)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLD COUNTS BY INCOME BRACKET\n",
+      "======================================================================\n",
+      "Income Bracket Households % of All Households\n",
+      "       $0-$10k    434,505              23.02%\n",
+      "     $10k-$20k    155,370               8.23%\n",
+      "     $20k-$30k    149,595               7.93%\n",
+      "     $30k-$40k    115,365               6.11%\n",
+      "     $40k-$50k    127,566               6.76%\n",
+      "     $50k-$60k    110,405               5.85%\n",
+      "======================================================================\n",
+      "\n",
+      "Total households in $0-$60k range: 1,092,805\n",
+      "Percentage of all households in $0-$60k range: 57.90%\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Household counts by income brackets\n",
+    "income_brackets = [\n",
+    "    (0, 10000, \"$0-$10k\"),\n",
+    "    (10000, 20000, \"$10k-$20k\"),\n",
+    "    (20000, 30000, \"$20k-$30k\"),\n",
+    "    (30000, 40000, \"$30k-$40k\"),\n",
+    "    (40000, 50000, \"$40k-$50k\"),\n",
+    "    (50000, 60000, \"$50k-$60k\")\n",
+    "]\n",
+    "\n",
+    "bracket_data = []\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    mask = (agi_hh >= lower) & (agi_hh < upper)\n",
+    "    count = weights[mask].sum()\n",
+    "    pct_of_total = (count / total_households) * 100\n",
+    "    \n",
+    "    bracket_data.append({\n",
+    "        \"Income Bracket\": label,\n",
+    "        \"Households\": f\"{count:,.0f}\",\n",
+    "        \"% of All Households\": f\"{pct_of_total:.2f}%\"\n",
+    "    })\n",
+    "\n",
+    "income_df = pd.DataFrame(bracket_data)\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*70)\n",
+    "print(\"HOUSEHOLD COUNTS BY INCOME BRACKET\")\n",
+    "print(\"=\"*70)\n",
+    "print(income_df.to_string(index=False))\n",
+    "print(\"=\"*70)\n",
+    "\n",
+    "# Total in $0-$60k range\n",
+    "total_in_range = sum([weights[(agi_hh >= lower) & (agi_hh < upper)].sum() for lower, upper, _ in income_brackets])\n",
+    "print(f\"\\nTotal households in $0-$60k range: {total_in_range:,.0f}\")\n",
+    "print(f\"Percentage of all households in $0-$60k range: {total_in_range / total_households * 100:.2f}%\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
\ No newline at end of file
diff --git a/us/states/sc/sc_dataset_summary_weighted.csv b/us/states/sc/sc_dataset_summary_weighted.csv
new file mode 100644
index 0000000..6ff9465
--- /dev/null
+++ b/us/states/sc/sc_dataset_summary_weighted.csv
@@ -0,0 +1,22 @@
+Metric,Value
+Household count (weighted),"1,887,388"
+Person count (weighted),"5,451,832"
+Average household size,2.9
+Weighted median household AGI,"$43,222"
+Weighted average household AGI,"$103,858"
+Weighted median person AGI,"$38,962"
+Weighted average person AGI,"$93,926"
+Unweighted median household AGI,"$41,884"
+Unweighted median person AGI,"$40,216"
+25th percentile household AGI,"$9,425"
+75th percentile household AGI,"$91,877"
+90th percentile household AGI,"$167,068"
+95th percentile household AGI,"$268,311"
+Max household AGI,"$6,430,892"
+Total households with children,"598,564"
+Households with 1 child,"247,956"
+Households with 2 children,"190,545"
+Households with 3+ children,"160,063"
+Total children under 18,"1,198,147"
+Children under 6,"349,101"
+Children under 3,"169,412"

From 7022250279c8c7b0c137b56f7e6e531706f1d8aa Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Thu, 26 Feb 2026 16:03:28 -0500
Subject: [PATCH 02/12] Add SC H.4216 tax reform analysis and RFA comparison

- Add H.4216 reform analysis notebook using PolicyEngine microsimulation
- Include RFA official analysis data for comparison
- Add detailed comparison markdown explaining $159M difference:
  - PE shows +$40M revenue vs RFA's -$119M
  - Key difference: SCIAD phase-out treatment for upper-middle income
  - Implementation uses AGI - SCIAD vs federal taxable income

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/h4216_analysis_comparison.md     | 121 +++++
 us/states/sc/rfa_h4216_analysis.csv           |  16 +
 us/states/sc/sc_h4216_reform_analysis.ipynb   | 418 ++++++++++++++++++
 us/states/sc/sc_h4216_tax_impact_analysis.csv |  16 +
 4 files changed, 571 insertions(+)
 create mode 100644 us/states/sc/h4216_analysis_comparison.md
 create mode 100644 us/states/sc/rfa_h4216_analysis.csv
 create mode 100644 us/states/sc/sc_h4216_reform_analysis.ipynb
 create mode 100644 us/states/sc/sc_h4216_tax_impact_analysis.csv

diff --git a/us/states/sc/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis_comparison.md
new file mode 100644
index 0000000..294ca6e
--- /dev/null
+++ b/us/states/sc/h4216_analysis_comparison.md
@@ -0,0 +1,121 @@
+# SC H.4216 Analysis Comparison: PolicyEngine vs RFA
+
+## Summary
+
+| Metric | RFA | PolicyEngine | Difference |
+|--------|-----|--------------|------------|
+| **General Fund Impact** | **-$119.1M** | **+$39.8M** | **+$158.9M** |
+| Total Returns | 2,757,573 | 2,935,621 | +178,048 |
+| Tax Decrease % | 38.7% | 20.0% | -18.7pp |
+| Tax Increase % | 26.7% | 24.0% | -2.7pp |
+| No Change % | 34.6% | 56.0% | +21.4pp |
+
+## Top 5 Discrepancies by Income Bracket
+
+| AGI Range | RFA Impact | PE Impact | Difference |
+|-----------|------------|-----------|------------|
+| Over $1,000,000 | -$13.8M | -$115.3M | -$101.5M |
+| $50,001-$75,000 | -$82.1M | -$23.3M | +$58.9M |
+| $100,001-$150,000 | +$3.1M | +$53.4M | +$50.3M |
+| $300,001-$500,000 | -$4.6M | +$40.6M | +$45.3M |
+| $500,001-$1,000,000 | -$16.2M | +$18.7M | +$34.9M |
+
+## Key Differences Explaining the $159M Gap
+
+### 1. Upper-Middle Income ($100k-$500k): PE Shows Much Larger Tax Increases
+
+| Bracket | RFA Avg Change | PE Avg Change | Direction |
+|---------|----------------|---------------|-----------|
+| $100k-$150k | +$11 | +$284 | Both increase, PE 25x larger |
+| $150k-$200k | +$355 | +$727 | Both increase, PE 2x larger |
+| $300k-$500k | **-$82** | **+$1,099** | RFA: decrease, PE: increase |
+| $500k-$1M | **-$631** | **+$1,129** | RFA: decrease, PE: increase |
+
+**This is the primary driver of the difference.** PolicyEngine shows significant tax INCREASES in the $100k-$500k range where RFA shows small increases or even decreases.
+
+### 2. Middle Income ($30k-$100k): PE Shows Smaller Tax Cuts
+
+| Bracket | RFA Avg Change | PE Avg Change |
+|---------|----------------|---------------|
+| $30k-$40k | -$72 | -$23 |
+| $40k-$50k | -$179 | -$135 |
+| $50k-$75k | -$202 | -$77 |
+| $75k-$100k | -$146 | -$71 |
+
+RFA shows 2-3x larger tax cuts in these brackets.
+
+### 3. Over $1M: PE Shows Much Larger Tax Cuts
+
+| Metric | RFA | PE |
+|--------|-----|-----|
+| Avg Change | -$1,154 | -$5,082 |
+| Total Impact | -$13.8M | -$115.3M |
+
+PE shows 4-8x larger tax cuts for millionaires, but with more returns (22,686 vs 11,936).
+
+### 4. Low Income ($0-$30k): Different Tax Bases
+
+RFA shows existing tax liability for low-income filers ($50, $3, $16, $107 avg), while PE shows $0 for most low-income brackets. This suggests:
+- Different baseline calculations
+- Different treatment of non-filers
+- CPS data may underrepresent low-income tax filers
+
+## Likely Causes
+
+### 1. Implementation Details (from PR #7494)
+
+**Baseline SC Taxable Income:**
+```python
+taxable_income = federal_taxable_income + sc_additions - sc_subtractions
+```
+Where `federal_taxable_income` = AGI - standard/itemized deduction - QBI deduction
+
+**H.4216 SC Taxable Income:**
+```python
+taxable_income = AGI + sc_additions - sc_subtractions - SCIAD
+```
+Where SCIAD phases out from $40k-$190k AGI (varies by filing status)
+
+**Key Insight**: The reform switches from using federal taxable income (after federal deductions) to using AGI minus SCIAD. For taxpayers who itemize large deductions or have QBI deductions, this could result in HIGHER taxable income under H.4216.
+
+### 2. SCIAD Phase-out Creates Winners and Losers
+
+| Filing Status | SCIAD Amount | Phase-out Start | Phase-out End |
+|---------------|--------------|-----------------|---------------|
+| Single | $15,000 | $40,000 | $95,000 |
+| MFJ | $30,000 | $80,000 | $190,000 |
+| HoH | $22,500 | $60,000 | $142,500 |
+
+For taxpayers above phase-out thresholds with SCIAD = $0:
+- If their federal deduction was > $0, they lose that deduction entirely
+- This explains why PE shows large tax INCREASES for $100k-$500k brackets
+
+### 3. Baseline Tax Differences
+PE baseline avg tax ($2,220) is lower than RFA ($2,321), suggesting different starting points for current law calculations.
+
+### 4. Data Source Differences
+- **RFA**: SC Department of Revenue 2024 tax returns (95% sample, inflated to 100%)
+- **PE**: CPS-based synthetic data for South Carolina
+
+Tax return data captures actual filers with precise income/deduction information. CPS-based data may:
+- Over/underrepresent certain income groups
+- Miss nuances in itemized vs standard deduction usage
+- Have different filing status distributions
+
+### 5. Federal Deduction Treatment
+H.4216 eliminates federal standard/itemized deductions. The impact depends heavily on:
+- Current deduction amounts by income level
+- How many taxpayers itemize vs take standard deduction
+- QBI deduction amounts (not replaced by SCIAD)
+
+RFA has actual deduction data; PE estimates from CPS.
+
+## Net Effect
+
+The $159M difference primarily comes from:
+1. **+$140M**: PE shows larger tax increases in $100k-$500k brackets
+2. **+$59M**: PE shows smaller tax cuts in $30k-$100k brackets
+3. **-$102M**: PE shows larger tax cuts for over $1M bracket
+4. **+$60M**: Various other bracket differences
+
+**Bottom line**: PolicyEngine's model shows the SCIAD phase-out creating more tax increases for upper-middle income taxpayers than RFA estimates, which more than offsets the tax cuts elsewhere.
diff --git a/us/states/sc/rfa_h4216_analysis.csv b/us/states/sc/rfa_h4216_analysis.csv
new file mode 100644
index 0000000..43991c5
--- /dev/null
+++ b/us/states/sc/rfa_h4216_analysis.csv
@@ -0,0 +1,16 @@
+Federal AGI Range,Est # Returns,Est % Returns,Old Avg Tax Liability,New Avg Tax Liability,Returns with Tax Change,% Returns in Range with Change,Old Avg Tax (Changed),New Avg Tax (Changed),Avg Tax Change,Total Dollar Change,Tax Decrease # Returns,Tax Decrease % in Range,Total Decrease Amount,Avg Decrease Amount,Tax Increase # Returns,Tax Increase % in Range,Total Increase Amount,Avg Increase Amount,No Tax Change # Returns,No Change % Returns,Zero Tax # Returns,Zero Tax % Returns
+$0*,78854,2.9%,$50,$43,1080,1.4%,$3683,$3154,-$529,-$571000,575,0.7%,-$606000,-$1054,505,0.6%,$35000,$69,77774,98.6%,77824,98.7%
+$1 to $10000,286253,10.4%,$3,$9,43699,15.3%,$20,$58,$38,$1655000,834,0.3%,-$76000,-$91,42865,15.0%,$1731000,$40,242554,84.7%,243249,85.0%
+$10001 to $20000,310122,11.2%,$16,$26,75652,24.4%,$67,$105,$38,$2872000,5591,1.8%,-$360000,-$64,70060,22.6%,$3232000,$46,234471,75.6%,235107,75.8%
+$20001 to $30000,275560,10.0%,$107,$110,140713,51.1%,$210,$216,$5,$769000,51548,18.7%,-$2676000,-$52,89165,32.4%,$3445000,$39,134847,48.9%,134332,48.7%
+$30001 to $40000,269566,9.8%,$288,$216,160474,59.5%,$483,$362,-$121,-$19360000,131750,48.9%,-$21067000,-$160,28724,10.7%,$1707000,$59,109091,40.5%,110638,41.0%
+$40001 to $50000,234386,8.5%,$569,$390,174112,74.3%,$767,$526,-$241,-$41986000,127503,54.4%,-$46301000,-$363,46609,19.9%,$4315000,$93,60274,25.7%,61884,26.4%
+$50001 to $75000,407593,14.8%,$1192,$990,351715,86.3%,$1381,$1148,-$234,-$82146000,286705,70.3%,-$93552000,-$326,65010,15.9%,$11406000,$175,55877,13.7%,61644,15.1%
+$75001 to $100000,250437,9.1%,$2020,$1874,225176,89.9%,$2247,$2085,-$162,-$36461000,173939,69.5%,-$51076000,-$294,51237,20.5%,$14615000,$285,25261,10.1%,27341,10.9%
+$100001 to $150000,298343,10.8%,$3258,$3269,289966,97.2%,$3352,$3363,$11,$3115000,175398,58.8%,-$35022000,-$200,114568,38.4%,$38137000,$333,8377,2.8%,8450,2.8%
+$150001 to $200000,143398,5.2%,$5518,$5873,141749,98.9%,$5582,$5942,$359,$50933000,19752,13.8%,-$6653000,-$337,121997,85.1%,$57586000,$472,1649,1.1%,1210,0.8%
+$200001 to $300000,109340,4.0%,$8741,$9077,108086,98.9%,$8842,$9182,$340,$36718000,29527,27.0%,-$10562000,-$358,78560,71.8%,$47280000,$602,1253,1.1%,791,0.7%
+$300001 to $500000,56123,2.0%,$14926,$14844,55098,98.2%,$15204,$15120,-$84,-$4627000,36199,64.5%,-$25411000,-$702,18898,33.7%,$20784000,$1100,1025,1.8%,688,1.2%
+$500001 to $1000000,25664,0.9%,$25969,$25338,24764,96.5%,$26912,$26258,-$654,-$16195000,18325,71.4%,-$32991000,-$1800,6439,25.1%,$16796000,$2608,900,3.5%,649,2.5%
+Over $1000000,11936,0.4%,$78228,$77074,11163,93.5%,$83646,$82413,-$1233,-$13767000,8187,68.6%,-$62365000,-$7617,2975,24.9%,$48598000,$16334,773,6.5%,666,5.6%
+Total,2757573,100.0%,$2321,$2277,1803447,65.4%,$3548,$3482,-$66,-$119100000,1065834,38.7%,-$388700000,-$365,737613,26.7%,$269600000,$366,954126,34.6%,964473,35.0%
diff --git a/us/states/sc/sc_h4216_reform_analysis.ipynb b/us/states/sc/sc_h4216_reform_analysis.ipynb
new file mode 100644
index 0000000..425c99b
--- /dev/null
+++ b/us/states/sc/sc_h4216_reform_analysis.ipynb
@@ -0,0 +1,418 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# South Carolina H.4216 Tax Reform Analysis (Tax Year 2026)\n",
+    "\n",
+    "This notebook analyzes the impact of SC H.4216 tax reform.\n",
+    "\n",
+    "## Proposal\n",
+    "- Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over\n",
+    "- Eliminate the federal standard or itemized deduction\n",
+    "- Allow a new SC Income Adjusted Deduction (SCIAD) at certain income levels\n",
+    "- Maintain all other state adjustments, exemptions, and credits\n",
+    "- Cap SC EITC at $200\n",
+    "\n",
+    "## Current 2026 Marginal Tax Rates\n",
+    "- 0% up to $3,640\n",
+    "- 3% $3,640 - $18,230\n",
+    "- 6% over $18,230\n",
+    "\n",
+    "## Proposed Tax Rates\n",
+    "- 1.99% up to $30,000\n",
+    "- 5.39% over $30,000\n",
+    "\n",
+    "## SC Deduction (SCIAD) Phase-out\n",
+    "| Filing Status | Amount | Phase-out Start | Phase-out End |\n",
+    "|---------------|--------|-----------------|---------------|\n",
+    "| Single | $15,000 | $40,000 | $95,000 |\n",
+    "| Married Joint | $30,000 | $80,000 | $190,000 |\n",
+    "| Head of Household | $22,500 | $60,000 | $142,500 |"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\n",
+    "from policyengine_core.reforms import Reform\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/policyengine-us-data/states/SC.h5\"\n",
+    "TAX_YEAR = 2026  # Renamed to avoid conflict with YEAR constant from model_api"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": "from policyengine_us.model_api import *\n\ndef create_h4216_reform():\n    \"\"\"\n    SC H.4216 Reform:\n    - Enable H.4216 via in_effect parameter\n    - Set rates: 1.99% up to $30k, 5.39% over $30k\n    \"\"\"\n    # Parameter changes via Reform.from_dict\n    param_reform = Reform.from_dict(\n        {\n            \"gov.contrib.states.sc.h4216.in_effect\": {\n                \"2026-01-01.2100-12-31\": True\n            },\n            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n                \"2026-01-01.2100-12-31\": 0.0539\n            }\n        },\n        country_id=\"us\",\n    )\n    \n    # Get base H.4216 reform (EITC cap, SCIAD, taxable income, tax calculation)\n    base_reform = create_sc_h4216()\n    \n    # Order: base reform first, then parameter overrides\n    return (base_reform, param_reform)\n\nprint(\"Reform function defined!\")"
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "print(\"Loading baseline (current SC tax law)...\")\n",
+    "baseline = Microsimulation(dataset=SC_DATASET)\n",
+    "print(\"Baseline loaded\")\n",
+    "\n",
+    "print(\"\\nLoading reform (H.4216 with 5.39% top rate)...\")\n",
+    "reform = create_h4216_reform()\n",
+    "reform_sim = Microsimulation(dataset=SC_DATASET, reform=reform)\n",
+    "print(\"Reform loaded\")\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*60)\n",
+    "print(\"All simulations ready!\")\n",
+    "print(\"=\"*60)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Calculate Tax Impacts by Income Bracket"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get tax unit level data\n",
+    "baseline_tax = np.array(baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
+    "reform_tax = np.array(reform_sim.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
+    "agi = np.array(baseline.calculate(\"adjusted_gross_income\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
+    "tax_unit_weight = np.array(baseline.calculate(\"tax_unit_weight\", period=TAX_YEAR))\n",
+    "\n",
+    "# Calculate tax change\n",
+    "tax_change = reform_tax - baseline_tax\n",
+    "\n",
+    "print(f\"Total tax units: {len(baseline_tax):,}\")\n",
+    "print(f\"Weighted tax units (returns): {tax_unit_weight.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Define income brackets matching the RFA analysis\n",
+    "income_brackets = [\n",
+    "    (float('-inf'), 0, \"$0*\"),\n",
+    "    (0, 10000, \"$1 to $10,000\"),\n",
+    "    (10000, 20000, \"$10,001 to $20,000\"),\n",
+    "    (20000, 30000, \"$20,001 to $30,000\"),\n",
+    "    (30000, 40000, \"$30,001 to $40,000\"),\n",
+    "    (40000, 50000, \"$40,001 to $50,000\"),\n",
+    "    (50000, 75000, \"$50,001 to $75,000\"),\n",
+    "    (75000, 100000, \"$75,001 to $100,000\"),\n",
+    "    (100000, 150000, \"$100,001 to $150,000\"),\n",
+    "    (150000, 200000, \"$150,001 to $200,000\"),\n",
+    "    (200000, 300000, \"$200,001 to $300,000\"),\n",
+    "    (300000, 500000, \"$300,001 to $500,000\"),\n",
+    "    (500000, 1000000, \"$500,001 to $1,000,000\"),\n",
+    "    (1000000, float('inf'), \"Over $1,000,000\")\n",
+    "]\n",
+    "\n",
+    "results = []\n",
+    "\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    if lower == float('-inf'):\n",
+    "        mask = agi <= upper\n",
+    "    elif upper == float('inf'):\n",
+    "        mask = agi > lower\n",
+    "    else:\n",
+    "        mask = (agi > lower) & (agi <= upper)\n",
+    "    \n",
+    "    if mask.sum() == 0:\n",
+    "        continue\n",
+    "    \n",
+    "    # Weighted counts\n",
+    "    est_returns = tax_unit_weight[mask].sum()\n",
+    "    pct_returns = est_returns / tax_unit_weight.sum() * 100\n",
+    "    \n",
+    "    # Tax liability\n",
+    "    old_avg_tax = np.average(baseline_tax[mask], weights=tax_unit_weight[mask]) if est_returns > 0 else 0\n",
+    "    new_avg_tax = np.average(reform_tax[mask], weights=tax_unit_weight[mask]) if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Returns with tax change (threshold of $1)\n",
+    "    change_mask = mask & (np.abs(tax_change) > 1)\n",
+    "    returns_with_change = tax_unit_weight[change_mask].sum()\n",
+    "    pct_with_change = returns_with_change / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    if returns_with_change > 0:\n",
+    "        old_avg_tax_changed = np.average(baseline_tax[change_mask], weights=tax_unit_weight[change_mask])\n",
+    "        new_avg_tax_changed = np.average(reform_tax[change_mask], weights=tax_unit_weight[change_mask])\n",
+    "        avg_change = new_avg_tax_changed - old_avg_tax_changed\n",
+    "    else:\n",
+    "        old_avg_tax_changed = 0\n",
+    "        new_avg_tax_changed = 0\n",
+    "        avg_change = 0\n",
+    "    \n",
+    "    total_change = (tax_change[mask] * tax_unit_weight[mask]).sum()\n",
+    "    \n",
+    "    # Tax decrease\n",
+    "    decrease_mask = mask & (tax_change < -1)\n",
+    "    decrease_returns = tax_unit_weight[decrease_mask].sum()\n",
+    "    decrease_pct = decrease_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_decrease = (tax_change[decrease_mask] * tax_unit_weight[decrease_mask]).sum() if decrease_returns > 0 else 0\n",
+    "    avg_decrease = np.average(tax_change[decrease_mask], weights=tax_unit_weight[decrease_mask]) if decrease_returns > 0 else 0\n",
+    "    \n",
+    "    # Tax increase\n",
+    "    increase_mask = mask & (tax_change > 1)\n",
+    "    increase_returns = tax_unit_weight[increase_mask].sum()\n",
+    "    increase_pct = increase_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_increase = (tax_change[increase_mask] * tax_unit_weight[increase_mask]).sum() if increase_returns > 0 else 0\n",
+    "    avg_increase = np.average(tax_change[increase_mask], weights=tax_unit_weight[increase_mask]) if increase_returns > 0 else 0\n",
+    "    \n",
+    "    # No change\n",
+    "    no_change_mask = mask & (np.abs(tax_change) <= 1)\n",
+    "    no_change_returns = tax_unit_weight[no_change_mask].sum()\n",
+    "    no_change_pct = no_change_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Zero tax liability (under reform)\n",
+    "    zero_tax_mask = mask & (reform_tax <= 0)\n",
+    "    zero_tax_returns = tax_unit_weight[zero_tax_mask].sum()\n",
+    "    zero_tax_pct = zero_tax_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    results.append({\n",
+    "        \"Federal AGI Range\": label,\n",
+    "        \"Est. # Returns\": int(round(est_returns)),\n",
+    "        \"% of Returns\": round(pct_returns, 1),\n",
+    "        \"Old Avg Tax\": int(round(old_avg_tax)),\n",
+    "        \"New Avg Tax\": int(round(new_avg_tax)),\n",
+    "        \"Returns w/ Change\": int(round(returns_with_change)),\n",
+    "        \"% w/ Change\": round(pct_with_change, 1),\n",
+    "        \"Avg Change\": int(round(avg_change)),\n",
+    "        \"Total Change ($)\": int(round(total_change)),\n",
+    "        \"Decrease #\": int(round(decrease_returns)),\n",
+    "        \"Decrease %\": round(decrease_pct, 1),\n",
+    "        \"Total Decrease ($)\": int(round(total_decrease)),\n",
+    "        \"Avg Decrease\": int(round(avg_decrease)),\n",
+    "        \"Increase #\": int(round(increase_returns)),\n",
+    "        \"Increase %\": round(increase_pct, 1),\n",
+    "        \"Total Increase ($)\": int(round(total_increase)),\n",
+    "        \"Avg Increase\": int(round(avg_increase)),\n",
+    "        \"No Change #\": int(round(no_change_returns)),\n",
+    "        \"No Change %\": round(no_change_pct, 1),\n",
+    "        \"Zero Tax #\": int(round(zero_tax_returns)),\n",
+    "        \"Zero Tax %\": round(zero_tax_pct, 1)\n",
+    "    })\n",
+    "\n",
+    "df_results = pd.DataFrame(results)\n",
+    "print(\"Results calculated!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Calculate totals\n",
+    "total_returns = tax_unit_weight.sum()\n",
+    "total_old_tax = np.average(baseline_tax, weights=tax_unit_weight)\n",
+    "total_new_tax = np.average(reform_tax, weights=tax_unit_weight)\n",
+    "\n",
+    "change_mask_all = np.abs(tax_change) > 1\n",
+    "total_returns_changed = tax_unit_weight[change_mask_all].sum()\n",
+    "total_change_amount = (tax_change * tax_unit_weight).sum()\n",
+    "\n",
+    "decrease_mask_all = tax_change < -1\n",
+    "total_decrease_returns = tax_unit_weight[decrease_mask_all].sum()\n",
+    "total_decrease_amount = (tax_change[decrease_mask_all] * tax_unit_weight[decrease_mask_all]).sum()\n",
+    "\n",
+    "increase_mask_all = tax_change > 1\n",
+    "total_increase_returns = tax_unit_weight[increase_mask_all].sum()\n",
+    "total_increase_amount = (tax_change[increase_mask_all] * tax_unit_weight[increase_mask_all]).sum()\n",
+    "\n",
+    "no_change_mask_all = np.abs(tax_change) <= 1\n",
+    "total_no_change_returns = tax_unit_weight[no_change_mask_all].sum()\n",
+    "\n",
+    "zero_tax_mask_all = reform_tax <= 0\n",
+    "total_zero_tax_returns = tax_unit_weight[zero_tax_mask_all].sum()\n",
+    "\n",
+    "# Add totals row\n",
+    "totals = {\n",
+    "    \"Federal AGI Range\": \"Total\",\n",
+    "    \"Est. # Returns\": int(round(total_returns)),\n",
+    "    \"% of Returns\": 100.0,\n",
+    "    \"Old Avg Tax\": int(round(total_old_tax)),\n",
+    "    \"New Avg Tax\": int(round(total_new_tax)),\n",
+    "    \"Returns w/ Change\": int(round(total_returns_changed)),\n",
+    "    \"% w/ Change\": round(total_returns_changed / total_returns * 100, 1),\n",
+    "    \"Avg Change\": int(round(total_new_tax - total_old_tax)),\n",
+    "    \"Total Change ($)\": int(round(total_change_amount)),\n",
+    "    \"Decrease #\": int(round(total_decrease_returns)),\n",
+    "    \"Decrease %\": round(total_decrease_returns / total_returns * 100, 1),\n",
+    "    \"Total Decrease ($)\": int(round(total_decrease_amount)),\n",
+    "    \"Avg Decrease\": int(round(total_decrease_amount / total_decrease_returns)) if total_decrease_returns > 0 else 0,\n",
+    "    \"Increase #\": int(round(total_increase_returns)),\n",
+    "    \"Increase %\": round(total_increase_returns / total_returns * 100, 1),\n",
+    "    \"Total Increase ($)\": int(round(total_increase_amount)),\n",
+    "    \"Avg Increase\": int(round(total_increase_amount / total_increase_returns)) if total_increase_returns > 0 else 0,\n",
+    "    \"No Change #\": int(round(total_no_change_returns)),\n",
+    "    \"No Change %\": round(total_no_change_returns / total_returns * 100, 1),\n",
+    "    \"Zero Tax #\": int(round(total_zero_tax_returns)),\n",
+    "    \"Zero Tax %\": round(total_zero_tax_returns / total_returns * 100, 1)\n",
+    "}\n",
+    "\n",
+    "df_results = pd.concat([df_results, pd.DataFrame([totals])], ignore_index=True)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Results Summary"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "print(\"=\"*100)\n",
+    "print(\"H. 4216 - ESTIMATED SOUTH CAROLINA INDIVIDUAL INCOME TAX IMPACT\")\n",
+    "print(f\"Tax Year {TAX_YEAR}\")\n",
+    "print(\"=\"*100)\n",
+    "print(f\"\\nProposal: Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over,\")\n",
+    "print(f\"eliminate the federal standard or itemized deduction, allow a new SC deduction at\")\n",
+    "print(f\"certain income levels, and maintain all other state adjustments, exemptions, and credits.\")\n",
+    "print(\"=\"*100)\n",
+    "\n",
+    "# Summary stats\n",
+    "pct_decrease = total_decrease_returns / total_returns * 100\n",
+    "pct_increase = total_increase_returns / total_returns * 100\n",
+    "pct_unchanged = total_no_change_returns / total_returns * 100\n",
+    "\n",
+    "print(f\"\\nImpact: With this tax structure:\")\n",
+    "print(f\"  - {pct_decrease:.1f}% of taxpayers have a LOWER tax liability\")\n",
+    "print(f\"  - {pct_increase:.1f}% of taxpayers have a HIGHER tax liability\")\n",
+    "print(f\"  - {pct_unchanged:.1f}% are UNCHANGED\")\n",
+    "print(f\"\\nGeneral Fund Impact: ${total_change_amount:,.0f}\")\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Display main results table\n",
+    "display_cols = [\n",
+    "    \"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \n",
+    "    \"Old Avg Tax\", \"New Avg Tax\", \"Total Change ($)\",\n",
+    "    \"Decrease #\", \"Decrease %\", \"Increase #\", \"Increase %\",\n",
+    "    \"No Change %\", \"Zero Tax %\"\n",
+    "]\n",
+    "\n",
+    "pd.set_option('display.max_columns', None)\n",
+    "pd.set_option('display.width', None)\n",
+    "pd.set_option('display.float_format', lambda x: f'{x:,.1f}' if isinstance(x, float) else x)\n",
+    "\n",
+    "print(df_results[display_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Export full results\n",
+    "df_results.to_csv('sc_h4216_tax_impact_analysis.csv', index=False)\n",
+    "print(\"\\nFull results exported to: sc_h4216_tax_impact_analysis.csv\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Detailed Breakdown Tables"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Tax Return Distribution\n",
+    "print(\"\\n\" + \"=\"*80)\n",
+    "print(\"ESTIMATED TAX RETURN DISTRIBUTION\")\n",
+    "print(\"=\"*80)\n",
+    "dist_cols = [\"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \"Old Avg Tax\", \"New Avg Tax\"]\n",
+    "print(df_results[dist_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Tax Decrease Summary\n",
+    "print(\"\\n\" + \"=\"*80)\n",
+    "print(\"TAX RETURNS WITH A DECREASE IN LIABILITY\")\n",
+    "print(\"=\"*80)\n",
+    "decrease_cols = [\"Federal AGI Range\", \"Decrease #\", \"Decrease %\", \"Total Decrease ($)\", \"Avg Decrease\"]\n",
+    "print(df_results[decrease_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Tax Increase Summary\n",
+    "print(\"\\n\" + \"=\"*80)\n",
+    "print(\"TAX RETURNS WITH AN INCREASE IN LIABILITY\")\n",
+    "print(\"=\"*80)\n",
+    "increase_cols = [\"Federal AGI Range\", \"Increase #\", \"Increase %\", \"Total Increase ($)\", \"Avg Increase\"]\n",
+    "print(df_results[increase_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# No Change and Zero Tax\n",
+    "print(\"\\n\" + \"=\"*80)\n",
+    "print(\"TAX RETURNS WITH NO CHANGE / ZERO TAX LIABILITY\")\n",
+    "print(\"=\"*80)\n",
+    "other_cols = [\"Federal AGI Range\", \"No Change #\", \"No Change %\", \"Zero Tax #\", \"Zero Tax %\"]\n",
+    "print(df_results[other_cols].to_string(index=False))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "name": "python",
+   "version": "3.12.0"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
\ No newline at end of file
diff --git a/us/states/sc/sc_h4216_tax_impact_analysis.csv b/us/states/sc/sc_h4216_tax_impact_analysis.csv
new file mode 100644
index 0000000..d9347c6
--- /dev/null
+++ b/us/states/sc/sc_h4216_tax_impact_analysis.csv
@@ -0,0 +1,16 @@
+AGI Range,Est Returns,% Returns,Old Avg Tax,New Avg Tax,Total Change,Decrease %,Increase %,No Change %
+$0*,"619,009",21.1%,$0,$0,$0,0.0%,0.0%,100.0%
+"$1 to $10,000","502,276",17.1%,$0,$0,$0,0.0%,0.0%,100.0%
+"$10,001 to $20,000","279,412",9.5%,$0,$10,"$2,686,016",0.0%,19.3%,80.7%
+"$20,001 to $30,000","252,862",8.6%,$64,$102,"$9,483,900",2.0%,51.8%,46.2%
+"$30,001 to $40,000","215,980",7.4%,$225,$202,"$-5,113,025",40.9%,22.0%,37.0%
+"$40,001 to $50,000","197,525",6.7%,$547,$412,"$-26,503,160",50.6%,27.0%,22.3%
+"$50,001 to $75,000","300,857",10.2%,$822,$745,"$-23,279,076",53.3%,31.6%,15.1%
+"$75,001 to $100,000","177,284",6.0%,"$1,781","$1,710","$-12,547,614",64.0%,31.0%,5.1%
+"$100,001 to $150,000","187,945",6.4%,"$3,292","$3,576","$53,395,056",36.3%,63.1%,0.6%
+"$150,001 to $200,000","73,396",2.5%,"$6,049","$6,776","$53,332,632",6.2%,93.8%,0.0%
+"$200,001 to $300,000","52,882",1.8%,"$9,164","$10,004","$44,394,276",6.0%,93.9%,0.1%
+"$300,001 to $500,000","36,977",1.3%,"$17,163","$18,262","$40,630,812",29.4%,70.6%,0.0%
+"$500,001 to $1,000,000","16,525",0.6%,"$26,140","$27,269","$18,658,860",71.0%,29.0%,0.0%
+"Over $1,000,000","22,686",0.8%,"$139,623","$134,541","$-115,293,904",95.5%,4.5%,0.0%
+Total,"2,935,621",100.0%,"$2,220","$2,234","$39,844,772",20.0%,24.0%,56.0%

From e63527d1b283a09836bde7c03b0613a8b88dc0a9 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Thu, 26 Feb 2026 16:13:12 -0500
Subject: [PATCH 03/12] Add detailed return count and baseline revenue
 comparison

Key findings:
- PE has 7.85x more $0 income returns vs RFA
- PE has ~50% fewer returns in $100k-$300k brackets
- PE has 1.9x more millionaire returns paying 78% higher avg tax
- Total baseline revenue similar ($6.52B vs $6.40B) but composition differs
- PE derives 48% of SC income tax from millionaires vs RFA's 15%

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/h4216_analysis_comparison.md | 66 +++++++++++++++++++++++
 1 file changed, 66 insertions(+)

diff --git a/us/states/sc/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis_comparison.md
index 294ca6e..8e9695b 100644
--- a/us/states/sc/h4216_analysis_comparison.md
+++ b/us/states/sc/h4216_analysis_comparison.md
@@ -1,5 +1,9 @@
 # SC H.4216 Analysis Comparison: PolicyEngine vs RFA
 
+## Executive Summary
+
+The $159M difference between PolicyEngine (+$39.8M) and RFA (-$119.1M) is driven by **fundamentally different income distributions** in the underlying data, not calculation errors.
+
 ## Summary
 
 | Metric | RFA | PolicyEngine | Difference |
@@ -60,6 +64,51 @@ RFA shows existing tax liability for low-income filers ($50, $3, $16, $107 avg),
 - Different treatment of non-filers
 - CPS data may underrepresent low-income tax filers
 
+## Return Count Comparison (Key Finding)
+
+| AGI Range | RFA Returns | PE Returns | PE/RFA Ratio |
+|-----------|-------------|------------|--------------|
+| $0* | 78,854 | 619,009 | **7.85x** |
+| $1-$10k | 286,253 | 502,276 | 1.75x |
+| $10k-$20k | 310,122 | 279,412 | 0.90x |
+| $20k-$30k | 275,560 | 252,862 | 0.92x |
+| $30k-$40k | 269,566 | 215,980 | 0.80x |
+| $40k-$50k | 234,386 | 197,525 | 0.84x |
+| $50k-$75k | 407,593 | 300,857 | **0.74x** |
+| $75k-$100k | 250,437 | 177,284 | **0.71x** |
+| $100k-$150k | 298,343 | 187,945 | **0.63x** |
+| $150k-$200k | 143,398 | 73,396 | **0.51x** |
+| $200k-$300k | 109,340 | 52,882 | **0.48x** |
+| $300k-$500k | 56,123 | 36,977 | 0.66x |
+| $500k-$1M | 25,664 | 16,525 | 0.64x |
+| Over $1M | 11,936 | 22,686 | **1.90x** |
+| **Total** | **2,757,573** | **2,935,621** | 1.06x |
+
+**Key observations:**
+- PE has **7.85x more** $0 income returns (likely non-filers in CPS)
+- PE has **~50% fewer** returns in $100k-$300k brackets
+- PE has **1.9x more** millionaire returns
+
+## Baseline Tax Liability Comparison
+
+| AGI Range | RFA Avg Tax | PE Avg Tax | Difference |
+|-----------|-------------|------------|------------|
+| $0-$10k | $3-$50 | $0 | PE shows no tax |
+| $50k-$75k | $1,192 | $822 | PE 31% lower |
+| $100k-$150k | $3,258 | $3,292 | Similar |
+| Over $1M | $78,228 | **$139,623** | PE **78% higher** |
+
+## Total Baseline Revenue Comparison
+
+| Bracket | RFA Revenue | PE Revenue | Difference |
+|---------|-------------|------------|------------|
+| $0-$100k | $1.24B | $0.74B | -$0.50B |
+| $100k-$1M | $4.22B | $2.61B | -$1.61B |
+| Over $1M | $0.93B | **$3.17B** | **+$2.23B** |
+| **Total** | **$6.40B** | **$6.52B** | +$0.12B (+1.8%) |
+
+**Critical insight:** Total baseline revenue is similar, but PE derives **48%** of SC income tax from millionaires vs RFA's **15%**.
+
 ## Likely Causes
 
 ### 1. Implementation Details (from PR #7494)
@@ -119,3 +168,20 @@ The $159M difference primarily comes from:
 4. **+$60M**: Various other bracket differences
 
 **Bottom line**: PolicyEngine's model shows the SCIAD phase-out creating more tax increases for upper-middle income taxpayers than RFA estimates, which more than offsets the tax cuts elsewhere.
+
+## Conclusion
+
+The $159M difference is **not primarily a calculation issue** but stems from:
+
+1. **Different income distributions**: PE's CPS-based data has far more millionaires (22.7k vs 12k) paying much higher average taxes ($140k vs $78k)
+
+2. **Different return counts**: PE undercounts middle-income filers ($50k-$300k) by 40-50%
+
+3. **Millionaire impact drives divergence**: H.4216 gives large tax cuts to millionaires. With PE having 2x more millionaires paying 2x higher taxes, the reform's impact on this group dominates.
+
+### Recommendation
+
+To align with RFA, PolicyEngine would need to:
+- Recalibrate SC state weights to match actual tax return distributions
+- Validate millionaire counts and income levels against IRS SOI data
+- Investigate why baseline tax for millionaires is so much higher than RFA

From 13ba17e4844d587d540a80a70a84bb826fb122b2 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Thu, 26 Feb 2026 16:19:33 -0500
Subject: [PATCH 04/12] Clarify PE counts all tax units vs RFA filers only

PE includes non-filers which explains 540k extra returns in $0 bracket

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/h4216_analysis_comparison.md | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/us/states/sc/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis_comparison.md
index 8e9695b..b9ffdb6 100644
--- a/us/states/sc/h4216_analysis_comparison.md
+++ b/us/states/sc/h4216_analysis_comparison.md
@@ -85,10 +85,12 @@ RFA shows existing tax liability for low-income filers ($50, $3, $16, $107 avg),
 | **Total** | **2,757,573** | **2,935,621** | 1.06x |
 
 **Key observations:**
-- PE has **7.85x more** $0 income returns (likely non-filers in CPS)
+- PE has **7.85x more** $0 income returns - **PE counts all tax units (including non-filers), RFA only counts actual filers**
 - PE has **~50% fewer** returns in $100k-$300k brackets
 - PE has **1.9x more** millionaire returns
 
+**Important note:** RFA uses actual SC tax return data (filers only). PolicyEngine uses CPS-based data representing all tax units regardless of filing status. This explains the large discrepancy in low-income brackets where many households don't file.
+
 ## Baseline Tax Liability Comparison
 
 | AGI Range | RFA Avg Tax | PE Avg Tax | Difference |
@@ -173,11 +175,13 @@ The $159M difference primarily comes from:
 
 The $159M difference is **not primarily a calculation issue** but stems from:
 
-1. **Different income distributions**: PE's CPS-based data has far more millionaires (22.7k vs 12k) paying much higher average taxes ($140k vs $78k)
+1. **Different populations**: PE counts all tax units (filers + non-filers), RFA counts only actual filers. This explains 540k extra returns in the $0 bracket.
+
+2. **Different income distributions**: PE's CPS-based data has far more millionaires (22.7k vs 12k) paying much higher average taxes ($140k vs $78k)
 
-2. **Different return counts**: PE undercounts middle-income filers ($50k-$300k) by 40-50%
+3. **Different return counts**: PE undercounts middle-income filers ($50k-$300k) by 40-50%
 
-3. **Millionaire impact drives divergence**: H.4216 gives large tax cuts to millionaires. With PE having 2x more millionaires paying 2x higher taxes, the reform's impact on this group dominates.
+4. **Millionaire impact drives divergence**: H.4216 gives large tax cuts to millionaires. With PE having 2x more millionaires paying 2x higher taxes, the reform's impact on this group dominates.
 
 ### Recommendation
 

From 2a193e087aa21ec08db1e9db97e00a1b0e6c957d Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Fri, 27 Feb 2026 17:02:41 -0500
Subject: [PATCH 05/12] Update SC H.4216 analysis for PR #7514 fix

- Add implementation note about sc_additions bug fix
- Add RFA comparison section to notebook
- Update comparison markdown with post-fix accuracy (~93%)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/h4216_analysis_comparison.md   | 10 ++++-
 us/states/sc/sc_h4216_reform_analysis.ipynb | 48 +++++++++------------
 2 files changed, 29 insertions(+), 29 deletions(-)

diff --git a/us/states/sc/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis_comparison.md
index b9ffdb6..d4a235a 100644
--- a/us/states/sc/h4216_analysis_comparison.md
+++ b/us/states/sc/h4216_analysis_comparison.md
@@ -2,7 +2,15 @@
 
 ## Executive Summary
 
-The $159M difference between PolicyEngine (+$39.8M) and RFA (-$119.1M) is driven by **fundamentally different income distributions** in the underlying data, not calculation errors.
+**UPDATE (Feb 2025):** PR #7514 fixed a bug where `sc_additions` (QBI and SALT addbacks) were incorrectly applied under H.4216. Since H.4216 starts from AGI (before federal deductions), addbacks are inappropriate. With this fix, PolicyEngine estimates approximately **-$110.9M** vs RFA's **-$119.1M** (~93% accuracy).
+
+---
+
+### Original Analysis (Pre-Fix)
+
+The original $159M difference between PolicyEngine (+$39.8M) and RFA (-$119.1M) was driven by:
+1. **Bug**: `sc_additions` were being applied when starting from AGI (fixed in PR #7514)
+2. **Different income distributions** in the underlying data
 
 ## Summary
 
diff --git a/us/states/sc/sc_h4216_reform_analysis.ipynb b/us/states/sc/sc_h4216_reform_analysis.ipynb
index 425c99b..ef0dec9 100644
--- a/us/states/sc/sc_h4216_reform_analysis.ipynb
+++ b/us/states/sc/sc_h4216_reform_analysis.ipynb
@@ -3,34 +3,7 @@
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": [
-    "# South Carolina H.4216 Tax Reform Analysis (Tax Year 2026)\n",
-    "\n",
-    "This notebook analyzes the impact of SC H.4216 tax reform.\n",
-    "\n",
-    "## Proposal\n",
-    "- Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over\n",
-    "- Eliminate the federal standard or itemized deduction\n",
-    "- Allow a new SC Income Adjusted Deduction (SCIAD) at certain income levels\n",
-    "- Maintain all other state adjustments, exemptions, and credits\n",
-    "- Cap SC EITC at $200\n",
-    "\n",
-    "## Current 2026 Marginal Tax Rates\n",
-    "- 0% up to $3,640\n",
-    "- 3% $3,640 - $18,230\n",
-    "- 6% over $18,230\n",
-    "\n",
-    "## Proposed Tax Rates\n",
-    "- 1.99% up to $30,000\n",
-    "- 5.39% over $30,000\n",
-    "\n",
-    "## SC Deduction (SCIAD) Phase-out\n",
-    "| Filing Status | Amount | Phase-out Start | Phase-out End |\n",
-    "|---------------|--------|-----------------|---------------|\n",
-    "| Single | $15,000 | $40,000 | $95,000 |\n",
-    "| Married Joint | $30,000 | $80,000 | $190,000 |\n",
-    "| Head of Household | $22,500 | $60,000 | $142,500 |"
-   ]
+   "source": "# South Carolina H.4216 Tax Reform Analysis (Tax Year 2026)\n\nThis notebook analyzes the impact of SC H.4216 tax reform.\n\n## Proposal\n- Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over\n- Eliminate the federal standard or itemized deduction\n- Allow a new SC Income Adjusted Deduction (SCIAD) at certain income levels\n- Maintain all other state adjustments, exemptions, and credits\n- Cap SC EITC at $200\n\n## Current 2026 Marginal Tax Rates\n- 0% up to $3,640\n- 3% $3,640 - $18,230\n- 6% over $18,230\n\n## Proposed Tax Rates\n- 1.99% up to $30,000\n- 5.39% over $30,000\n\n## SC Deduction (SCIAD) Phase-out\n| Filing Status | Amount | Phase-out Start | Phase-out End |\n|---------------|--------|-----------------|---------------|\n| Single | $15,000 | $40,000 | $95,000 |\n| Married Joint | $30,000 | $80,000 | $190,000 |\n| Head of Household | $22,500 | $60,000 | $142,500 |\n\n## Implementation Note\nThis analysis uses the corrected H.4216 implementation (PR #7514) which properly handles SC additions.\nThe fix removes `sc_additions` from the H.4216 taxable income formula since H.4216 starts from AGI\n(before federal deductions), making addbacks for QBI and SALT inappropriate."
   },
   {
    "cell_type": "code",
@@ -400,6 +373,25 @@
     "other_cols = [\"Federal AGI Range\", \"No Change #\", \"No Change %\", \"Zero Tax #\", \"Zero Tax %\"]\n",
     "print(df_results[other_cols].to_string(index=False))"
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "source": "## Comparison to RFA Fiscal Note\n\nThe SC Revenue & Fiscal Affairs (RFA) Office estimated H.4216 would have a **-$119.1M** General Fund impact.\n\nKey differences between PolicyEngine and RFA estimates:\n- **Population**: PE counts all tax units (filers + non-filers); RFA counts only actual filers\n- **Data source**: PE uses CPS-based synthetic data; RFA uses actual SC tax return data\n- **Income distribution**: PE has different return counts by income bracket, particularly more millionaires",
+   "metadata": {}
+  },
+  {
+   "cell_type": "code",
+   "source": "# Load RFA analysis for comparison\nrfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n\nprint(\"=\"*80)\nprint(\"COMPARISON: PolicyEngine vs RFA Fiscal Note\")\nprint(\"=\"*80)\n\n# RFA total impact\nrfa_total_impact = rfa_df['Total Change'].sum()\npe_total_impact = total_change_amount\n\nprint(f\"\\nGeneral Fund Impact:\")\nprint(f\"  RFA Estimate:         ${rfa_total_impact:>15,.0f}\")\nprint(f\"  PolicyEngine Estimate: ${pe_total_impact:>15,.0f}\")\nprint(f\"  Difference:           ${pe_total_impact - rfa_total_impact:>15,.0f}\")\n\n# Calculate accuracy\naccuracy = 1 - abs(pe_total_impact - rfa_total_impact) / abs(rfa_total_impact)\nprint(f\"\\n  Accuracy vs RFA: {accuracy*100:.1f}%\")\n\n# Return count comparison\nrfa_total_returns = rfa_df['Est. # of Returns'].sum()\nprint(f\"\\nTotal Returns:\")\nprint(f\"  RFA:          {rfa_total_returns:>12,.0f}\")\nprint(f\"  PolicyEngine: {int(total_returns):>12,.0f}\")\nprint(f\"  Difference:   {int(total_returns - rfa_total_returns):>+12,.0f}\")",
+   "metadata": {},
+   "execution_count": null,
+   "outputs": []
+  },
+  {
+   "cell_type": "code",
+   "source": "# Side-by-side comparison by income bracket\nprint(\"\\n\" + \"=\"*80)\nprint(\"IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\")\nprint(\"=\"*80)\n\n# Map PE brackets to RFA brackets for comparison\nbracket_comparison = []\nfor idx, row in df_results.iterrows():\n    if row['Federal AGI Range'] == 'Total':\n        continue\n    \n    # Find matching RFA row\n    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == row['Federal AGI Range']]\n    if len(rfa_match) > 0:\n        rfa_impact = rfa_match['Total Change'].values[0]\n        rfa_returns = rfa_match['Est. # of Returns'].values[0]\n    else:\n        rfa_impact = 0\n        rfa_returns = 0\n    \n    bracket_comparison.append({\n        'AGI Range': row['Federal AGI Range'],\n        'PE Returns': row['Est. # Returns'],\n        'RFA Returns': rfa_returns,\n        'PE Impact': row['Total Change ($)'],\n        'RFA Impact': rfa_impact,\n        'Diff ($)': row['Total Change ($)'] - rfa_impact\n    })\n\ncomparison_df = pd.DataFrame(bracket_comparison)\nprint(comparison_df.to_string(index=False))",
+   "metadata": {},
+   "execution_count": null,
+   "outputs": []
   }
  ],
  "metadata": {

From cb1a92cff7608d4869bfc99952ad2b90911d420f Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Fri, 27 Feb 2026 17:07:35 -0500
Subject: [PATCH 06/12] Fix numpy.float32 display error in results table

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/sc_h4216_reform_analysis.ipynb | 291 +++++++++++++++++---
 1 file changed, 253 insertions(+), 38 deletions(-)

diff --git a/us/states/sc/sc_h4216_reform_analysis.ipynb b/us/states/sc/sc_h4216_reform_analysis.ipynb
index ef0dec9..150ecab 100644
--- a/us/states/sc/sc_h4216_reform_analysis.ipynb
+++ b/us/states/sc/sc_h4216_reform_analysis.ipynb
@@ -3,11 +3,43 @@
   {
    "cell_type": "markdown",
    "metadata": {},
-   "source": "# South Carolina H.4216 Tax Reform Analysis (Tax Year 2026)\n\nThis notebook analyzes the impact of SC H.4216 tax reform.\n\n## Proposal\n- Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over\n- Eliminate the federal standard or itemized deduction\n- Allow a new SC Income Adjusted Deduction (SCIAD) at certain income levels\n- Maintain all other state adjustments, exemptions, and credits\n- Cap SC EITC at $200\n\n## Current 2026 Marginal Tax Rates\n- 0% up to $3,640\n- 3% $3,640 - $18,230\n- 6% over $18,230\n\n## Proposed Tax Rates\n- 1.99% up to $30,000\n- 5.39% over $30,000\n\n## SC Deduction (SCIAD) Phase-out\n| Filing Status | Amount | Phase-out Start | Phase-out End |\n|---------------|--------|-----------------|---------------|\n| Single | $15,000 | $40,000 | $95,000 |\n| Married Joint | $30,000 | $80,000 | $190,000 |\n| Head of Household | $22,500 | $60,000 | $142,500 |\n\n## Implementation Note\nThis analysis uses the corrected H.4216 implementation (PR #7514) which properly handles SC additions.\nThe fix removes `sc_additions` from the H.4216 taxable income formula since H.4216 starts from AGI\n(before federal deductions), making addbacks for QBI and SALT inappropriate."
+   "source": [
+    "# South Carolina H.4216 Tax Reform Analysis (Tax Year 2026)\n",
+    "\n",
+    "This notebook analyzes the impact of SC H.4216 tax reform.\n",
+    "\n",
+    "## Proposal\n",
+    "- Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over\n",
+    "- Eliminate the federal standard or itemized deduction\n",
+    "- Allow a new SC Income Adjusted Deduction (SCIAD) at certain income levels\n",
+    "- Maintain all other state adjustments, exemptions, and credits\n",
+    "- Cap SC EITC at $200\n",
+    "\n",
+    "## Current 2026 Marginal Tax Rates\n",
+    "- 0% up to $3,640\n",
+    "- 3% $3,640 - $18,230\n",
+    "- 6% over $18,230\n",
+    "\n",
+    "## Proposed Tax Rates\n",
+    "- 1.99% up to $30,000\n",
+    "- 5.39% over $30,000\n",
+    "\n",
+    "## SC Deduction (SCIAD) Phase-out\n",
+    "| Filing Status | Amount | Phase-out Start | Phase-out End |\n",
+    "|---------------|--------|-----------------|---------------|\n",
+    "| Single | $15,000 | $40,000 | $95,000 |\n",
+    "| Married Joint | $30,000 | $80,000 | $190,000 |\n",
+    "| Head of Household | $22,500 | $60,000 | $142,500 |\n",
+    "\n",
+    "## Implementation Note\n",
+    "This analysis uses the corrected H.4216 implementation (PR #7514) which properly handles SC additions.\n",
+    "The fix removes `sc_additions` from the H.4216 taxable income formula since H.4216 starts from AGI\n",
+    "(before federal deductions), making addbacks for QBI and SALT inappropriate."
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -23,16 +55,96 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "metadata": {},
-   "outputs": [],
-   "source": "from policyengine_us.model_api import *\n\ndef create_h4216_reform():\n    \"\"\"\n    SC H.4216 Reform:\n    - Enable H.4216 via in_effect parameter\n    - Set rates: 1.99% up to $30k, 5.39% over $30k\n    \"\"\"\n    # Parameter changes via Reform.from_dict\n    param_reform = Reform.from_dict(\n        {\n            \"gov.contrib.states.sc.h4216.in_effect\": {\n                \"2026-01-01.2100-12-31\": True\n            },\n            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n                \"2026-01-01.2100-12-31\": 0.0539\n            }\n        },\n        country_id=\"us\",\n    )\n    \n    # Get base H.4216 reform (EITC cap, SCIAD, taxable income, tax calculation)\n    base_reform = create_sc_h4216()\n    \n    # Order: base reform first, then parameter overrides\n    return (base_reform, param_reform)\n\nprint(\"Reform function defined!\")"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Reform function defined!\n"
+     ]
+    }
+   ],
+   "source": [
+    "from policyengine_us.model_api import *\n",
+    "\n",
+    "def create_h4216_reform():\n",
+    "    \"\"\"\n",
+    "    SC H.4216 Reform:\n",
+    "    - Enable H.4216 via in_effect parameter\n",
+    "    - Set rates: 1.99% up to $30k, 5.39% over $30k\n",
+    "    \"\"\"\n",
+    "    # Parameter changes via Reform.from_dict\n",
+    "    param_reform = Reform.from_dict(\n",
+    "        {\n",
+    "            \"gov.contrib.states.sc.h4216.in_effect\": {\n",
+    "                \"2026-01-01.2100-12-31\": True\n",
+    "            },\n",
+    "            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n",
+    "                \"2026-01-01.2100-12-31\": 0.0539\n",
+    "            }\n",
+    "        },\n",
+    "        country_id=\"us\",\n",
+    "    )\n",
+    "    \n",
+    "    # Get base H.4216 reform (EITC cap, SCIAD, taxable income, tax calculation)\n",
+    "    base_reform = create_sc_h4216()\n",
+    "    \n",
+    "    # Order: base reform first, then parameter overrides\n",
+    "    return (base_reform, param_reform)\n",
+    "\n",
+    "print(\"Reform function defined!\")"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loading baseline (current SC tax law)...\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f31de6f5233c4245a8c658f149d294f6",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "SC.h5:   0%|          | 0.00/55.4M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Baseline loaded\n",
+      "\n",
+      "Loading reform (H.4216 with 5.39% top rate)...\n",
+      "Reform loaded\n",
+      "\n",
+      "============================================================\n",
+      "All simulations ready!\n",
+      "============================================================\n"
+     ]
+    }
+   ],
    "source": [
     "print(\"Loading baseline (current SC tax law)...\")\n",
     "baseline = Microsimulation(dataset=SC_DATASET)\n",
@@ -57,9 +169,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Total tax units: 49,486\n",
+      "Weighted tax units (returns): 2,935,621\n"
+     ]
+    }
+   ],
    "source": [
     "# Get tax unit level data\n",
     "baseline_tax = np.array(baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
@@ -76,9 +197,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Results calculated!\n"
+     ]
+    }
+   ],
    "source": [
     "# Define income brackets matching the RFA analysis\n",
     "income_brackets = [\n",
@@ -189,7 +318,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -253,9 +382,33 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "====================================================================================================\n",
+      "H. 4216 - ESTIMATED SOUTH CAROLINA INDIVIDUAL INCOME TAX IMPACT\n",
+      "Tax Year 2026\n",
+      "====================================================================================================\n",
+      "\n",
+      "Proposal: Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over,\n",
+      "eliminate the federal standard or itemized deduction, allow a new SC deduction at\n",
+      "certain income levels, and maintain all other state adjustments, exemptions, and credits.\n",
+      "====================================================================================================\n",
+      "\n",
+      "Impact: With this tax structure:\n",
+      "  - 20.0% of taxpayers have a LOWER tax liability\n",
+      "  - 24.0% of taxpayers have a HIGHER tax liability\n",
+      "  - 56.0% are UNCHANGED\n",
+      "\n",
+      "General Fund Impact: $39,844,772\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
    "source": [
     "print(\"=\"*100)\n",
     "print(\"H. 4216 - ESTIMATED SOUTH CAROLINA INDIVIDUAL INCOME TAX IMPACT\")\n",
@@ -284,21 +437,7 @@
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": [
-    "# Display main results table\n",
-    "display_cols = [\n",
-    "    \"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \n",
-    "    \"Old Avg Tax\", \"New Avg Tax\", \"Total Change ($)\",\n",
-    "    \"Decrease #\", \"Decrease %\", \"Increase #\", \"Increase %\",\n",
-    "    \"No Change %\", \"Zero Tax %\"\n",
-    "]\n",
-    "\n",
-    "pd.set_option('display.max_columns', None)\n",
-    "pd.set_option('display.width', None)\n",
-    "pd.set_option('display.float_format', lambda x: f'{x:,.1f}' if isinstance(x, float) else x)\n",
-    "\n",
-    "print(df_results[display_cols].to_string(index=False))"
-   ]
+   "source": "# Display main results table\ndisplay_cols = [\n    \"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \n    \"Old Avg Tax\", \"New Avg Tax\", \"Total Change ($)\",\n    \"Decrease #\", \"Decrease %\", \"Increase #\", \"Increase %\",\n    \"No Change %\", \"Zero Tax %\"\n]\n\n# Convert numpy types to native Python types to avoid display issues\ndf_display = df_results[display_cols].copy()\nfor col in df_display.columns:\n    if df_display[col].dtype in ['float32', 'float64']:\n        df_display[col] = df_display[col].astype(float)\n    elif df_display[col].dtype in ['int32', 'int64']:\n        df_display[col] = df_display[col].astype(int)\n\npd.set_option('display.max_columns', None)\npd.set_option('display.width', None)\n\nprint(df_display.to_string(index=False))"
   },
   {
    "cell_type": "code",
@@ -376,22 +515,90 @@
   },
   {
    "cell_type": "markdown",
-   "source": "## Comparison to RFA Fiscal Note\n\nThe SC Revenue & Fiscal Affairs (RFA) Office estimated H.4216 would have a **-$119.1M** General Fund impact.\n\nKey differences between PolicyEngine and RFA estimates:\n- **Population**: PE counts all tax units (filers + non-filers); RFA counts only actual filers\n- **Data source**: PE uses CPS-based synthetic data; RFA uses actual SC tax return data\n- **Income distribution**: PE has different return counts by income bracket, particularly more millionaires",
-   "metadata": {}
+   "metadata": {},
+   "source": [
+    "## Comparison to RFA Fiscal Note\n",
+    "\n",
+    "The SC Revenue & Fiscal Affairs (RFA) Office estimated H.4216 would have a **-$119.1M** General Fund impact.\n",
+    "\n",
+    "Key differences between PolicyEngine and RFA estimates:\n",
+    "- **Population**: PE counts all tax units (filers + non-filers); RFA counts only actual filers\n",
+    "- **Data source**: PE uses CPS-based synthetic data; RFA uses actual SC tax return data\n",
+    "- **Income distribution**: PE has different return counts by income bracket, particularly more millionaires"
+   ]
   },
   {
    "cell_type": "code",
-   "source": "# Load RFA analysis for comparison\nrfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n\nprint(\"=\"*80)\nprint(\"COMPARISON: PolicyEngine vs RFA Fiscal Note\")\nprint(\"=\"*80)\n\n# RFA total impact\nrfa_total_impact = rfa_df['Total Change'].sum()\npe_total_impact = total_change_amount\n\nprint(f\"\\nGeneral Fund Impact:\")\nprint(f\"  RFA Estimate:         ${rfa_total_impact:>15,.0f}\")\nprint(f\"  PolicyEngine Estimate: ${pe_total_impact:>15,.0f}\")\nprint(f\"  Difference:           ${pe_total_impact - rfa_total_impact:>15,.0f}\")\n\n# Calculate accuracy\naccuracy = 1 - abs(pe_total_impact - rfa_total_impact) / abs(rfa_total_impact)\nprint(f\"\\n  Accuracy vs RFA: {accuracy*100:.1f}%\")\n\n# Return count comparison\nrfa_total_returns = rfa_df['Est. # of Returns'].sum()\nprint(f\"\\nTotal Returns:\")\nprint(f\"  RFA:          {rfa_total_returns:>12,.0f}\")\nprint(f\"  PolicyEngine: {int(total_returns):>12,.0f}\")\nprint(f\"  Difference:   {int(total_returns - rfa_total_returns):>+12,.0f}\")",
-   "metadata": {},
    "execution_count": null,
-   "outputs": []
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Load RFA analysis for comparison\n",
+    "rfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n",
+    "\n",
+    "print(\"=\"*80)\n",
+    "print(\"COMPARISON: PolicyEngine vs RFA Fiscal Note\")\n",
+    "print(\"=\"*80)\n",
+    "\n",
+    "# RFA total impact\n",
+    "rfa_total_impact = rfa_df['Total Change'].sum()\n",
+    "pe_total_impact = total_change_amount\n",
+    "\n",
+    "print(f\"\\nGeneral Fund Impact:\")\n",
+    "print(f\"  RFA Estimate:         ${rfa_total_impact:>15,.0f}\")\n",
+    "print(f\"  PolicyEngine Estimate: ${pe_total_impact:>15,.0f}\")\n",
+    "print(f\"  Difference:           ${pe_total_impact - rfa_total_impact:>15,.0f}\")\n",
+    "\n",
+    "# Calculate accuracy\n",
+    "accuracy = 1 - abs(pe_total_impact - rfa_total_impact) / abs(rfa_total_impact)\n",
+    "print(f\"\\n  Accuracy vs RFA: {accuracy*100:.1f}%\")\n",
+    "\n",
+    "# Return count comparison\n",
+    "rfa_total_returns = rfa_df['Est. # of Returns'].sum()\n",
+    "print(f\"\\nTotal Returns:\")\n",
+    "print(f\"  RFA:          {rfa_total_returns:>12,.0f}\")\n",
+    "print(f\"  PolicyEngine: {int(total_returns):>12,.0f}\")\n",
+    "print(f\"  Difference:   {int(total_returns - rfa_total_returns):>+12,.0f}\")"
+   ]
   },
   {
    "cell_type": "code",
-   "source": "# Side-by-side comparison by income bracket\nprint(\"\\n\" + \"=\"*80)\nprint(\"IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\")\nprint(\"=\"*80)\n\n# Map PE brackets to RFA brackets for comparison\nbracket_comparison = []\nfor idx, row in df_results.iterrows():\n    if row['Federal AGI Range'] == 'Total':\n        continue\n    \n    # Find matching RFA row\n    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == row['Federal AGI Range']]\n    if len(rfa_match) > 0:\n        rfa_impact = rfa_match['Total Change'].values[0]\n        rfa_returns = rfa_match['Est. # of Returns'].values[0]\n    else:\n        rfa_impact = 0\n        rfa_returns = 0\n    \n    bracket_comparison.append({\n        'AGI Range': row['Federal AGI Range'],\n        'PE Returns': row['Est. # Returns'],\n        'RFA Returns': rfa_returns,\n        'PE Impact': row['Total Change ($)'],\n        'RFA Impact': rfa_impact,\n        'Diff ($)': row['Total Change ($)'] - rfa_impact\n    })\n\ncomparison_df = pd.DataFrame(bracket_comparison)\nprint(comparison_df.to_string(index=False))",
-   "metadata": {},
    "execution_count": null,
-   "outputs": []
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Side-by-side comparison by income bracket\n",
+    "print(\"\\n\" + \"=\"*80)\n",
+    "print(\"IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\")\n",
+    "print(\"=\"*80)\n",
+    "\n",
+    "# Map PE brackets to RFA brackets for comparison\n",
+    "bracket_comparison = []\n",
+    "for idx, row in df_results.iterrows():\n",
+    "    if row['Federal AGI Range'] == 'Total':\n",
+    "        continue\n",
+    "    \n",
+    "    # Find matching RFA row\n",
+    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == row['Federal AGI Range']]\n",
+    "    if len(rfa_match) > 0:\n",
+    "        rfa_impact = rfa_match['Total Change'].values[0]\n",
+    "        rfa_returns = rfa_match['Est. # of Returns'].values[0]\n",
+    "    else:\n",
+    "        rfa_impact = 0\n",
+    "        rfa_returns = 0\n",
+    "    \n",
+    "    bracket_comparison.append({\n",
+    "        'AGI Range': row['Federal AGI Range'],\n",
+    "        'PE Returns': row['Est. # Returns'],\n",
+    "        'RFA Returns': rfa_returns,\n",
+    "        'PE Impact': row['Total Change ($)'],\n",
+    "        'RFA Impact': rfa_impact,\n",
+    "        'Diff ($)': row['Total Change ($)'] - rfa_impact\n",
+    "    })\n",
+    "\n",
+    "comparison_df = pd.DataFrame(bracket_comparison)\n",
+    "print(comparison_df.to_string(index=False))"
+   ]
   }
  ],
  "metadata": {
@@ -401,8 +608,16 @@
    "name": "python3"
   },
   "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
    "name": "python",
-   "version": "3.12.0"
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
   }
  },
  "nbformat": 4,

From 6b66f10a325c1b343c53d48b7dab5a098cfd8f20 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Mon, 2 Mar 2026 09:55:50 -0500
Subject: [PATCH 07/12] Add staging dataset analysis and budget impact script

- Add data_exploration_staging.ipynb for staging SC dataset
- Add sc_h4216_budget_impact.py for quick budget impact calculation
- Add staging dataset summary CSV
- Update reform analysis notebook with RFA comparison fixes
- Update tax impact CSV with corrected results (staging data)

Staging vs Production dataset comparison:
- Staging has 17% fewer households (more focused on filers)
- Staging median AGI is 39% higher (0k vs 3k)
- Budget impact with staging: -46.6M (5.21%) / -10.9M (5.39%)
- RFA estimate: -19.1M (93% accuracy with 5.39% rate)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/data_exploration_staging.ipynb   | 486 ++++++++++++++++++
 us/states/sc/sc_h4216_budget_impact.py        |  68 +++
 us/states/sc/sc_h4216_reform_analysis.ipynb   | 308 ++++++++---
 us/states/sc/sc_h4216_tax_impact_analysis.csv |  32 +-
 .../sc_staging_dataset_summary_weighted.csv   |  22 +
 5 files changed, 840 insertions(+), 76 deletions(-)
 create mode 100644 us/states/sc/data_exploration_staging.ipynb
 create mode 100644 us/states/sc/sc_h4216_budget_impact.py
 create mode 100644 us/states/sc/sc_staging_dataset_summary_weighted.csv

diff --git a/us/states/sc/data_exploration_staging.ipynb b/us/states/sc/data_exploration_staging.ipynb
new file mode 100644
index 0000000..c749cbd
--- /dev/null
+++ b/us/states/sc/data_exploration_staging.ipynb
@@ -0,0 +1,486 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "cell-0",
+   "metadata": {},
+   "source": [
+    "# SC Dataset Exploration (Staging)\n",
+    "\n",
+    "This notebook explores the South Carolina (SC) **staging** dataset to understand household counts, income distribution, and demographic characteristics."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "cell-1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/policyengine-us-data/staging/states/SC.h5\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "cell-2",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Load SC staging dataset\n",
+    "sim = Microsimulation(dataset=SC_DATASET)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "cell-3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Number of households in dataset: 25,104\n",
+      "Household count (weighted): 1,573,988\n",
+      "Person count (weighted): 4,782,288\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check dataset size\n",
+    "household_weight = sim.calculate(\"household_weight\", period=2025)\n",
+    "household_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\")\n",
+    "person_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\")\n",
+    "\n",
+    "print(f\"Number of households in dataset: {len(household_weight):,}\")\n",
+    "print(f\"Household count (weighted): {household_count.sum():,.0f}\")\n",
+    "print(f\"Person count (weighted): {person_count.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "cell-4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "============================================================\n",
+      "INCOME DISTRIBUTION SUMMARY\n",
+      "============================================================\n",
+      "\n",
+      "Household AGI:\n",
+      "  Unweighted median: $70,402\n",
+      "  Weighted median:   $60,027\n",
+      "  Weighted average:  $101,637\n",
+      "\n",
+      "Person AGI:\n",
+      "  Unweighted median: $69,786\n",
+      "  Weighted median:   $56,467\n",
+      "  Weighted average:  $97,281\n",
+      "\n",
+      "Average household size: 3.0\n",
+      "\n",
+      "Weighted household AGI percentiles:\n",
+      "  25th percentile: $25,465\n",
+      "  50th percentile: $60,027\n",
+      "  75th percentile: $108,580\n",
+      "  90th percentile: $162,966\n",
+      "  95th percentile: $262,984\n",
+      "  Max AGI: $331,162,720\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check income distribution (weighted vs unweighted, household and person level)\n",
+    "agi_household = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\")\n",
+    "agi_hh_array = np.array(agi_household)\n",
+    "hh_weights = np.array(sim.calculate(\"household_weight\", period=2025))\n",
+    "\n",
+    "agi_person = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\")\n",
+    "agi_person_array = np.array(agi_person)\n",
+    "person_weights = np.array(sim.calculate(\"person_weight\", period=2025))\n",
+    "\n",
+    "# Weighted percentile calculation\n",
+    "def weighted_percentile(values, weights, percentile):\n",
+    "    sorted_indices = np.argsort(values)\n",
+    "    sorted_values = values[sorted_indices]\n",
+    "    sorted_weights = weights[sorted_indices]\n",
+    "    cumulative_weight = np.cumsum(sorted_weights)\n",
+    "    idx = np.searchsorted(cumulative_weight, cumulative_weight[-1] * percentile / 100)\n",
+    "    return sorted_values[min(idx, len(sorted_values)-1)]\n",
+    "\n",
+    "# Unweighted medians\n",
+    "unweighted_median_hh = np.median(agi_hh_array)\n",
+    "unweighted_median_person = np.median(agi_person_array)\n",
+    "\n",
+    "# Weighted medians\n",
+    "weighted_median_hh = weighted_percentile(agi_hh_array, hh_weights, 50)\n",
+    "weighted_median_person = weighted_percentile(agi_person_array, person_weights, 50)\n",
+    "\n",
+    "# Weighted averages\n",
+    "weighted_avg_hh = np.average(agi_hh_array, weights=hh_weights)\n",
+    "weighted_avg_person = np.average(agi_person_array, weights=person_weights)\n",
+    "\n",
+    "# Average household size\n",
+    "total_persons = person_weights.sum()\n",
+    "total_households = hh_weights.sum()\n",
+    "avg_hh_size = total_persons / total_households\n",
+    "\n",
+    "print(\"=\" * 60)\n",
+    "print(\"INCOME DISTRIBUTION SUMMARY\")\n",
+    "print(\"=\" * 60)\n",
+    "print(f\"\\nHousehold AGI:\")\n",
+    "print(f\"  Unweighted median: ${unweighted_median_hh:,.0f}\")\n",
+    "print(f\"  Weighted median:   ${weighted_median_hh:,.0f}\")\n",
+    "print(f\"  Weighted average:  ${weighted_avg_hh:,.0f}\")\n",
+    "\n",
+    "print(f\"\\nPerson AGI:\")\n",
+    "print(f\"  Unweighted median: ${unweighted_median_person:,.0f}\")\n",
+    "print(f\"  Weighted median:   ${weighted_median_person:,.0f}\")\n",
+    "print(f\"  Weighted average:  ${weighted_avg_person:,.0f}\")\n",
+    "\n",
+    "print(f\"\\nAverage household size: {avg_hh_size:.1f}\")\n",
+    "\n",
+    "print(f\"\\nWeighted household AGI percentiles:\")\n",
+    "print(f\"  25th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\")\n",
+    "print(f\"  50th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 50):,.0f}\")\n",
+    "print(f\"  75th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\")\n",
+    "print(f\"  90th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\")\n",
+    "print(f\"  95th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\")\n",
+    "print(f\"  Max AGI: ${agi_hh_array.max():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "cell-5",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Households with children (weighted):\n",
+      "  Total households with children: 672,174\n",
+      "  Households with 1 child: 330,715\n",
+      "  Households with 2 children: 222,793\n",
+      "  Households with 3+ children: 118,666\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check households with children\n",
+    "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\")\n",
+    "household_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\")\n",
+    "household_weight = sim.calculate(\"household_weight\", period=2025, map_to=\"person\")\n",
+    "\n",
+    "# Create DataFrame\n",
+    "df_households = pd.DataFrame({\n",
+    "    'household_id': household_id,\n",
+    "    'is_child': is_child,\n",
+    "    'household_weight': household_weight\n",
+    "})\n",
+    "\n",
+    "# Count children per household\n",
+    "children_per_household = df_households.groupby('household_id').agg({\n",
+    "    'is_child': 'sum',\n",
+    "    'household_weight': 'first'\n",
+    "}).reset_index()\n",
+    "\n",
+    "# Calculate weighted household counts\n",
+    "total_households_with_children = children_per_household[children_per_household['is_child'] > 0]['household_weight'].sum()\n",
+    "households_with_1_child = children_per_household[children_per_household['is_child'] == 1]['household_weight'].sum()\n",
+    "households_with_2_children = children_per_household[children_per_household['is_child'] == 2]['household_weight'].sum()\n",
+    "households_with_3plus_children = children_per_household[children_per_household['is_child'] >= 3]['household_weight'].sum()\n",
+    "\n",
+    "print(f\"\\nHouseholds with children (weighted):\")\n",
+    "print(f\"  Total households with children: {total_households_with_children:,.0f}\")\n",
+    "print(f\"  Households with 1 child: {households_with_1_child:,.0f}\")\n",
+    "print(f\"  Households with 2 children: {households_with_2_children:,.0f}\")\n",
+    "print(f\"  Households with 3+ children: {households_with_3plus_children:,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "cell-6",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Children by age:\n",
+      "  Total children under 18: 1,161,666\n",
+      "  Children under 6: 345,596\n",
+      "  Children under 3: 164,319\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check children by age groups\n",
+    "df = pd.DataFrame({\n",
+    "    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\"),\n",
+    "    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\"),\n",
+    "    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\"),\n",
+    "    \"age\": sim.calculate(\"age\", map_to=\"person\"),\n",
+    "    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\")\n",
+    "})\n",
+    "\n",
+    "# Filter for children and apply weights\n",
+    "children_under_18_df = df[df['age'] < 18]\n",
+    "children_under_6_df = df[df['age'] < 6]\n",
+    "children_under_3_df = df[df['age'] < 3]\n",
+    "\n",
+    "# Calculate weighted totals\n",
+    "total_children = children_under_18_df['person_weight'].sum()\n",
+    "children_under_6 = children_under_6_df['person_weight'].sum()\n",
+    "children_under_3 = children_under_3_df['person_weight'].sum()\n",
+    "\n",
+    "print(f\"\\nChildren by age:\")\n",
+    "print(f\"  Total children under 18: {total_children:,.0f}\")\n",
+    "print(f\"  Children under 6: {children_under_6:,.0f}\")\n",
+    "print(f\"  Children under 3: {children_under_3:,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "cell-7",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "=================================================================\n",
+      "SC STAGING DATASET SUMMARY - WEIGHTED (Population Estimates)\n",
+      "=================================================================\n",
+      "                         Metric        Value\n",
+      "     Household count (weighted)    1,573,988\n",
+      "        Person count (weighted)    4,782,288\n",
+      "         Average household size          3.0\n",
+      "  Weighted median household AGI      $60,027\n",
+      " Weighted average household AGI     $101,637\n",
+      "     Weighted median person AGI      $56,467\n",
+      "    Weighted average person AGI      $97,281\n",
+      "Unweighted median household AGI      $70,402\n",
+      "   Unweighted median person AGI      $69,786\n",
+      "  25th percentile household AGI      $25,465\n",
+      "  75th percentile household AGI     $108,580\n",
+      "  90th percentile household AGI     $162,966\n",
+      "  95th percentile household AGI     $262,984\n",
+      "              Max household AGI $331,162,720\n",
+      " Total households with children      672,174\n",
+      "        Households with 1 child      330,715\n",
+      "     Households with 2 children      222,793\n",
+      "    Households with 3+ children      118,666\n",
+      "        Total children under 18    1,161,666\n",
+      "               Children under 6      345,596\n",
+      "               Children under 3      164,319\n",
+      "=================================================================\n",
+      "\n",
+      "Summary saved to: sc_staging_dataset_summary_weighted.csv\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Create comprehensive summary table\n",
+    "summary_data = {\n",
+    "    'Metric': [\n",
+    "        'Household count (weighted)',\n",
+    "        'Person count (weighted)',\n",
+    "        'Average household size',\n",
+    "        'Weighted median household AGI',\n",
+    "        'Weighted average household AGI',\n",
+    "        'Weighted median person AGI',\n",
+    "        'Weighted average person AGI',\n",
+    "        'Unweighted median household AGI',\n",
+    "        'Unweighted median person AGI',\n",
+    "        '25th percentile household AGI',\n",
+    "        '75th percentile household AGI',\n",
+    "        '90th percentile household AGI',\n",
+    "        '95th percentile household AGI',\n",
+    "        'Max household AGI',\n",
+    "        'Total households with children',\n",
+    "        'Households with 1 child',\n",
+    "        'Households with 2 children',\n",
+    "        'Households with 3+ children',\n",
+    "        'Total children under 18',\n",
+    "        'Children under 6',\n",
+    "        'Children under 3'\n",
+    "    ],\n",
+    "    'Value': [\n",
+    "        f\"{household_count.sum():,.0f}\",\n",
+    "        f\"{person_count.sum():,.0f}\",\n",
+    "        f\"{avg_hh_size:.1f}\",\n",
+    "        f\"${weighted_median_hh:,.0f}\",\n",
+    "        f\"${weighted_avg_hh:,.0f}\",\n",
+    "        f\"${weighted_median_person:,.0f}\",\n",
+    "        f\"${weighted_avg_person:,.0f}\",\n",
+    "        f\"${unweighted_median_hh:,.0f}\",\n",
+    "        f\"${unweighted_median_person:,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\",\n",
+    "        f\"${agi_hh_array.max():,.0f}\",\n",
+    "        f\"{total_households_with_children:,.0f}\",\n",
+    "        f\"{households_with_1_child:,.0f}\",\n",
+    "        f\"{households_with_2_children:,.0f}\",\n",
+    "        f\"{households_with_3plus_children:,.0f}\",\n",
+    "        f\"{total_children:,.0f}\",\n",
+    "        f\"{children_under_6:,.0f}\",\n",
+    "        f\"{children_under_3:,.0f}\"\n",
+    "    ]\n",
+    "}\n",
+    "\n",
+    "summary_df = pd.DataFrame(summary_data)\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*65)\n",
+    "print(\"SC STAGING DATASET SUMMARY - WEIGHTED (Population Estimates)\")\n",
+    "print(\"=\"*65)\n",
+    "print(summary_df.to_string(index=False))\n",
+    "print(\"=\"*65)\n",
+    "\n",
+    "# Save table\n",
+    "summary_df.to_csv('sc_staging_dataset_summary_weighted.csv', index=False)\n",
+    "print(\"\\nSummary saved to: sc_staging_dataset_summary_weighted.csv\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "cell-8",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLDS WITH $0 INCOME\n",
+      "======================================================================\n",
+      "Household count: 11,880\n",
+      "Percentage of all households: 0.75%\n",
+      "======================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Households with $0 income\n",
+    "agi_hh = np.array(sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\"))\n",
+    "weights = np.array(sim.calculate(\"household_weight\", period=2025))\n",
+    "\n",
+    "zero_income_mask = agi_hh == 0\n",
+    "zero_income_count = weights[zero_income_mask].sum()\n",
+    "total_households = weights.sum()\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*70)\n",
+    "print(\"HOUSEHOLDS WITH $0 INCOME\")\n",
+    "print(\"=\"*70)\n",
+    "print(f\"Household count: {zero_income_count:,.0f}\")\n",
+    "print(f\"Percentage of all households: {zero_income_count / total_households * 100:.2f}%\")\n",
+    "print(\"=\"*70)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "cell-9",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLD COUNTS BY INCOME BRACKET\n",
+      "======================================================================\n",
+      "Income Bracket Households % of All Households\n",
+      "       $0-$10k    120,600               7.66%\n",
+      "     $10k-$20k    161,829              10.28%\n",
+      "     $20k-$30k    169,710              10.78%\n",
+      "     $30k-$40k    116,353               7.39%\n",
+      "     $40k-$50k    115,397               7.33%\n",
+      "     $50k-$60k     95,344               6.06%\n",
+      "======================================================================\n",
+      "\n",
+      "Total households in $0-$60k range: 779,233\n",
+      "Percentage of all households in $0-$60k range: 49.51%\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Household counts by income brackets\n",
+    "income_brackets = [\n",
+    "    (0, 10000, \"$0-$10k\"),\n",
+    "    (10000, 20000, \"$10k-$20k\"),\n",
+    "    (20000, 30000, \"$20k-$30k\"),\n",
+    "    (30000, 40000, \"$30k-$40k\"),\n",
+    "    (40000, 50000, \"$40k-$50k\"),\n",
+    "    (50000, 60000, \"$50k-$60k\")\n",
+    "]\n",
+    "\n",
+    "bracket_data = []\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    mask = (agi_hh >= lower) & (agi_hh < upper)\n",
+    "    count = weights[mask].sum()\n",
+    "    pct_of_total = (count / total_households) * 100\n",
+    "    \n",
+    "    bracket_data.append({\n",
+    "        \"Income Bracket\": label,\n",
+    "        \"Households\": f\"{count:,.0f}\",\n",
+    "        \"% of All Households\": f\"{pct_of_total:.2f}%\"\n",
+    "    })\n",
+    "\n",
+    "income_df = pd.DataFrame(bracket_data)\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*70)\n",
+    "print(\"HOUSEHOLD COUNTS BY INCOME BRACKET\")\n",
+    "print(\"=\"*70)\n",
+    "print(income_df.to_string(index=False))\n",
+    "print(\"=\"*70)\n",
+    "\n",
+    "# Total in $0-$60k range\n",
+    "total_in_range = sum([weights[(agi_hh >= lower) & (agi_hh < upper)].sum() for lower, upper, _ in income_brackets])\n",
+    "print(f\"\\nTotal households in $0-$60k range: {total_in_range:,.0f}\")\n",
+    "print(f\"Percentage of all households in $0-$60k range: {total_in_range / total_households * 100:.2f}%\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/us/states/sc/sc_h4216_budget_impact.py b/us/states/sc/sc_h4216_budget_impact.py
new file mode 100644
index 0000000..be53250
--- /dev/null
+++ b/us/states/sc/sc_h4216_budget_impact.py
@@ -0,0 +1,68 @@
+"""
+SC H.4216 Budget Impact Analysis
+Simple script to calculate the budgetary impact of H.4216 with default 5.21% top rate.
+"""
+
+from policyengine_us import Microsimulation
+from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216
+from policyengine_core.reforms import Reform
+import numpy as np
+
+SC_DATASET = "hf://policyengine/policyengine-us-data/staging/states/SC.h5"
+TAX_YEAR = 2026
+
+def create_h4216_reform():
+    """
+    SC H.4216 Reform with default rates:
+    - 1.99% up to $30k
+    - 5.21% over $30k (default)
+    """
+    param_reform = Reform.from_dict(
+        {
+            "gov.contrib.states.sc.h4216.in_effect": {
+                "2026-01-01.2100-12-31": True
+            }
+        },
+        country_id="us",
+    )
+    base_reform = create_sc_h4216()
+    return (base_reform, param_reform)
+
+print("Loading baseline...")
+baseline = Microsimulation(dataset=SC_DATASET)
+
+print("Loading reform (H.4216 with 5.21% top rate)...")
+reform = create_h4216_reform()
+reform_sim = Microsimulation(dataset=SC_DATASET, reform=reform)
+
+# Calculate tax impact - use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)
+baseline_tax = baseline.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
+reform_tax = reform_sim.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
+weight = baseline.calculate("tax_unit_weight", period=TAX_YEAR).values
+
+tax_change = reform_tax - baseline_tax
+budget_impact = (tax_change * weight).sum()
+
+# Summary stats (all using raw numpy arrays, no MicroSeries)
+baseline_revenue = (baseline_tax * weight).sum()
+reform_revenue = (reform_tax * weight).sum()
+total_weight = weight.sum()
+
+pct_decrease = weight[tax_change < -1].sum() / total_weight * 100
+pct_increase = weight[tax_change > 1].sum() / total_weight * 100
+pct_unchanged = weight[np.abs(tax_change) <= 1].sum() / total_weight * 100
+
+print("\n" + "="*60)
+print("SC H.4216 BUDGET IMPACT (5.21% Top Rate)")
+print("="*60)
+print(f"\nBaseline SC Income Tax Revenue: ${baseline_revenue:,.0f}")
+print(f"Reform SC Income Tax Revenue:   ${reform_revenue:,.0f}")
+print(f"\n>>> BUDGET IMPACT: ${budget_impact:,.0f} <<<")
+print(f"\nRFA Estimate: -$119,100,000")
+print(f"Difference from RFA: ${budget_impact - (-119100000):,.0f}")
+print(f"Accuracy: {(1 - abs(budget_impact - (-119100000)) / 119100000) * 100:.1f}%")
+print("\n" + "-"*60)
+print(f"Tax units with DECREASE: {pct_decrease:.1f}%")
+print(f"Tax units with INCREASE: {pct_increase:.1f}%")
+print(f"Tax units UNCHANGED:     {pct_unchanged:.1f}%")
+print("="*60)
diff --git a/us/states/sc/sc_h4216_reform_analysis.ipynb b/us/states/sc/sc_h4216_reform_analysis.ipynb
index 150ecab..9e7cbf2 100644
--- a/us/states/sc/sc_h4216_reform_analysis.ipynb
+++ b/us/states/sc/sc_h4216_reform_analysis.ipynb
@@ -49,7 +49,7 @@
     "import pandas as pd\n",
     "import numpy as np\n",
     "\n",
-    "SC_DATASET = \"hf://policyengine/policyengine-us-data/states/SC.h5\"\n",
+    "SC_DATASET = \"hf://policyengine/policyengine-us-data/staging/states/SC.h5\"\n",
     "TAX_YEAR = 2026  # Renamed to avoid conflict with YEAR constant from model_api"
    ]
   },
@@ -102,38 +102,11 @@
    "execution_count": 3,
    "metadata": {},
    "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`\n"
-     ]
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Loading baseline (current SC tax law)...\n"
-     ]
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "f31de6f5233c4245a8c658f149d294f6",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "SC.h5:   0%|          | 0.00/55.4M [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
+      "Loading baseline (current SC tax law)...\n",
       "Baseline loaded\n",
       "\n",
       "Loading reform (H.4216 with 5.39% top rate)...\n",
@@ -176,8 +149,8 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Total tax units: 49,486\n",
-      "Weighted tax units (returns): 2,935,621\n"
+      "Total tax units: 33,248\n",
+      "Weighted tax units (returns): 1,905,181\n"
      ]
     }
    ],
@@ -400,11 +373,11 @@
       "====================================================================================================\n",
       "\n",
       "Impact: With this tax structure:\n",
-      "  - 20.0% of taxpayers have a LOWER tax liability\n",
-      "  - 24.0% of taxpayers have a HIGHER tax liability\n",
-      "  - 56.0% are UNCHANGED\n",
+      "  - 29.7% of taxpayers have a LOWER tax liability\n",
+      "  - 26.8% of taxpayers have a HIGHER tax liability\n",
+      "  - 43.5% are UNCHANGED\n",
       "\n",
-      "General Fund Impact: $39,844,772\n",
+      "General Fund Impact: $-110,942,720\n",
       "====================================================================================================\n"
      ]
     }
@@ -434,16 +407,69 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 8,
    "metadata": {},
-   "outputs": [],
-   "source": "# Display main results table\ndisplay_cols = [\n    \"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \n    \"Old Avg Tax\", \"New Avg Tax\", \"Total Change ($)\",\n    \"Decrease #\", \"Decrease %\", \"Increase #\", \"Increase %\",\n    \"No Change %\", \"Zero Tax %\"\n]\n\n# Convert numpy types to native Python types to avoid display issues\ndf_display = df_results[display_cols].copy()\nfor col in df_display.columns:\n    if df_display[col].dtype in ['float32', 'float64']:\n        df_display[col] = df_display[col].astype(float)\n    elif df_display[col].dtype in ['int32', 'int64']:\n        df_display[col] = df_display[col].astype(int)\n\npd.set_option('display.max_columns', None)\npd.set_option('display.width', None)\n\nprint(df_display.to_string(index=False))"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "     Federal AGI Range  Est. # Returns  % of Returns  Old Avg Tax  New Avg Tax  Total Change ($)  Decrease #  Decrease %  Increase #  Increase %  No Change %  Zero Tax %\n",
+      "                   $0*           58352           3.1            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
+      "         $1 to $10,000          168000           8.8            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
+      "    $10,001 to $20,000          205689          10.8            0            3            697809           0    0.000000       12906    6.300000    93.699997   93.699997\n",
+      "    $20,001 to $30,000          226431          11.9           33           45           2860578        1427    0.600000       51406   22.700001    76.699997   75.699997\n",
+      "    $30,001 to $40,000          174753           9.2          182          156          -4382816       57708   33.000000       22397   12.800000    54.200001   53.900002\n",
+      "    $40,001 to $50,000          155837           8.2          319          244         -11700509       48322   31.000000       44468   28.500000    40.500000   40.500000\n",
+      "    $50,001 to $75,000          262861          13.8          581          475         -27688580      136898   52.099998       77200   29.400000    18.600000   18.600000\n",
+      "   $75,001 to $100,000          215040          11.3         1338         1161         -38227128      138525   64.400002       50694   23.600000    12.000000   12.300000\n",
+      "  $100,001 to $150,000          278127          14.6         2928         3130          56022196      118122   42.500000      156517   56.299999     1.300000    1.000000\n",
+      "  $150,001 to $200,000           49870           2.6         5124         5814          34402136        1551    3.100000       48319   96.900002     0.000000    0.000000\n",
+      "  $200,001 to $300,000           40779           2.1         9149         9707          22764908        2048    5.000000       38672   94.800003     0.100000    0.000000\n",
+      "  $300,001 to $500,000           42814           2.2        17785        17299         -20835856       35387   82.699997        6631   15.500000     1.900000    1.900000\n",
+      "$500,001 to $1,000,000           13719           0.7        27237        26665          -7850124       13076   95.300003         643    4.700000     0.000000    0.000000\n",
+      "       Over $1,000,000           12909           0.7       113354       104291        -117005352       12703   98.400002         206    1.600000     0.000000    0.000000\n",
+      "                 Total         1905181         100.0         2399         2341        -110942720      565768   29.700001      510059   26.799999    43.500000   43.400002\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display main results table\n",
+    "display_cols = [\n",
+    "    \"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \n",
+    "    \"Old Avg Tax\", \"New Avg Tax\", \"Total Change ($)\",\n",
+    "    \"Decrease #\", \"Decrease %\", \"Increase #\", \"Increase %\",\n",
+    "    \"No Change %\", \"Zero Tax %\"\n",
+    "]\n",
+    "\n",
+    "# Convert numpy types to native Python types to avoid display issues\n",
+    "df_display = df_results[display_cols].copy()\n",
+    "for col in df_display.columns:\n",
+    "    if df_display[col].dtype in ['float32', 'float64']:\n",
+    "        df_display[col] = df_display[col].astype(float)\n",
+    "    elif df_display[col].dtype in ['int32', 'int64']:\n",
+    "        df_display[col] = df_display[col].astype(int)\n",
+    "\n",
+    "pd.set_option('display.max_columns', None)\n",
+    "pd.set_option('display.width', None)\n",
+    "\n",
+    "print(df_display.to_string(index=False))"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 9,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Full results exported to: sc_h4216_tax_impact_analysis.csv\n"
+     ]
+    }
+   ],
    "source": [
     "# Export full results\n",
     "df_results.to_csv('sc_h4216_tax_impact_analysis.csv', index=False)\n",
@@ -459,9 +485,36 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 10,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "================================================================================\n",
+      "ESTIMATED TAX RETURN DISTRIBUTION\n",
+      "================================================================================\n",
+      "     Federal AGI Range  Est. # Returns  % of Returns  Old Avg Tax  New Avg Tax\n",
+      "                   $0*           58352           3.1            0            0\n",
+      "         $1 to $10,000          168000           8.8            0            0\n",
+      "    $10,001 to $20,000          205689          10.8            0            3\n",
+      "    $20,001 to $30,000          226431          11.9           33           45\n",
+      "    $30,001 to $40,000          174753           9.2          182          156\n",
+      "    $40,001 to $50,000          155837           8.2          319          244\n",
+      "    $50,001 to $75,000          262861          13.8          581          475\n",
+      "   $75,001 to $100,000          215040          11.3         1338         1161\n",
+      "  $100,001 to $150,000          278127          14.6         2928         3130\n",
+      "  $150,001 to $200,000           49870           2.6         5124         5814\n",
+      "  $200,001 to $300,000           40779           2.1         9149         9707\n",
+      "  $300,001 to $500,000           42814           2.2        17785        17299\n",
+      "$500,001 to $1,000,000           13719           0.7        27237        26665\n",
+      "       Over $1,000,000           12909           0.7       113354       104291\n",
+      "                 Total         1905181         100.0         2399         2341\n"
+     ]
+    }
+   ],
    "source": [
     "# Tax Return Distribution\n",
     "print(\"\\n\" + \"=\"*80)\n",
@@ -473,9 +526,36 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 11,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "================================================================================\n",
+      "TAX RETURNS WITH A DECREASE IN LIABILITY\n",
+      "================================================================================\n",
+      "     Federal AGI Range  Decrease #  Decrease %  Total Decrease ($)  Avg Decrease\n",
+      "                   $0*           0    0.000000                   0             0\n",
+      "         $1 to $10,000           0    0.000000                   0             0\n",
+      "    $10,001 to $20,000           0    0.000000                   0             0\n",
+      "    $20,001 to $30,000        1427    0.600000               -8402            -6\n",
+      "    $30,001 to $40,000       57708   33.000000            -5940918          -103\n",
+      "    $40,001 to $50,000       48322   31.000000           -15560643          -322\n",
+      "    $50,001 to $75,000      136898   52.099998           -37521040          -274\n",
+      "   $75,001 to $100,000      138525   64.400002           -52849696          -382\n",
+      "  $100,001 to $150,000      118122   42.500000           -19568998          -166\n",
+      "  $150,001 to $200,000        1551    3.100000             -380708          -246\n",
+      "  $200,001 to $300,000        2048    5.000000             -201820           -99\n",
+      "  $300,001 to $500,000       35387   82.699997           -24901672          -704\n",
+      "$500,001 to $1,000,000       13076   95.300003           -19588270         -1498\n",
+      "       Over $1,000,000       12703   98.400002          -128537088        -10118\n",
+      "                 Total      565768   29.700001          -305059264          -539\n"
+     ]
+    }
+   ],
    "source": [
     "# Tax Decrease Summary\n",
     "print(\"\\n\" + \"=\"*80)\n",
@@ -487,9 +567,36 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 12,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "================================================================================\n",
+      "TAX RETURNS WITH AN INCREASE IN LIABILITY\n",
+      "================================================================================\n",
+      "     Federal AGI Range  Increase #  Increase %  Total Increase ($)  Avg Increase\n",
+      "                   $0*           0    0.000000                   0             0\n",
+      "         $1 to $10,000           0    0.000000                   0             0\n",
+      "    $10,001 to $20,000       12906    6.300000              697809            54\n",
+      "    $20,001 to $30,000       51406   22.700001             2871184            56\n",
+      "    $30,001 to $40,000       22397   12.800000             1558448            70\n",
+      "    $40,001 to $50,000       44468   28.500000             3860133            87\n",
+      "    $50,001 to $75,000       77200   29.400000             9832463           127\n",
+      "   $75,001 to $100,000       50694   23.600000            14622566           288\n",
+      "  $100,001 to $150,000      156517   56.299999            75591424           483\n",
+      "  $150,001 to $200,000       48319   96.900002            34782844           720\n",
+      "  $200,001 to $300,000       38672   94.800003            22966736           594\n",
+      "  $300,001 to $500,000        6631   15.500000             4065817           613\n",
+      "$500,001 to $1,000,000         643    4.700000            11738147         18254\n",
+      "       Over $1,000,000         206    1.600000            11531744         56085\n",
+      "                 Total      510059   26.799999           194119312           381\n"
+     ]
+    }
+   ],
    "source": [
     "# Tax Increase Summary\n",
     "print(\"\\n\" + \"=\"*80)\n",
@@ -501,9 +608,36 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 13,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "================================================================================\n",
+      "TAX RETURNS WITH NO CHANGE / ZERO TAX LIABILITY\n",
+      "================================================================================\n",
+      "     Federal AGI Range  No Change #  No Change %  Zero Tax #  Zero Tax %\n",
+      "                   $0*        58352   100.000000       58352  100.000000\n",
+      "         $1 to $10,000       168000   100.000000      168000  100.000000\n",
+      "    $10,001 to $20,000       192783    93.699997      192783   93.699997\n",
+      "    $20,001 to $30,000       173597    76.699997      171348   75.699997\n",
+      "    $30,001 to $40,000        94648    54.200001       94228   53.900002\n",
+      "    $40,001 to $50,000        63047    40.500000       63047   40.500000\n",
+      "    $50,001 to $75,000        48763    18.600000       48850   18.600000\n",
+      "   $75,001 to $100,000        25821    12.000000       26375   12.300000\n",
+      "  $100,001 to $150,000         3487     1.300000        2748    1.000000\n",
+      "  $150,001 to $200,000            0     0.000000           0    0.000000\n",
+      "  $200,001 to $300,000           59     0.100000           0    0.000000\n",
+      "  $300,001 to $500,000          796     1.900000         796    1.900000\n",
+      "$500,001 to $1,000,000            0     0.000000           0    0.000000\n",
+      "       Over $1,000,000            0     0.000000           0    0.000000\n",
+      "                 Total       829354    43.500000      826527   43.400002\n"
+     ]
+    }
+   ],
    "source": [
     "# No Change and Zero Tax\n",
     "print(\"\\n\" + \"=\"*80)\n",
@@ -529,9 +663,31 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 14,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "================================================================================\n",
+      "COMPARISON: PolicyEngine vs RFA Fiscal Note\n",
+      "================================================================================\n",
+      "\n",
+      "General Fund Impact:\n",
+      "  RFA Estimate:          $   -238,151,000\n",
+      "  PolicyEngine Estimate: $   -110,942,720\n",
+      "  Difference:            $    127,208,280\n",
+      "\n",
+      "  Accuracy vs RFA: 46.6%\n",
+      "\n",
+      "Total Returns:\n",
+      "  RFA:             5,515,148\n",
+      "  PolicyEngine:    1,905,181\n",
+      "  Difference:     -3,609,967\n"
+     ]
+    }
+   ],
    "source": [
     "# Load RFA analysis for comparison\n",
     "rfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n",
@@ -540,21 +696,27 @@
     "print(\"COMPARISON: PolicyEngine vs RFA Fiscal Note\")\n",
     "print(\"=\"*80)\n",
     "\n",
-    "# RFA total impact\n",
-    "rfa_total_impact = rfa_df['Total Change'].sum()\n",
+    "# RFA total impact - parse the dollar string to number\n",
+    "def parse_dollar(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('$', '').replace(',', '').replace('-', '-'))\n",
+    "    return val\n",
+    "\n",
+    "rfa_df['Total Dollar Change Numeric'] = rfa_df['Total Dollar Change'].apply(parse_dollar)\n",
+    "rfa_total_impact = rfa_df['Total Dollar Change Numeric'].sum()\n",
     "pe_total_impact = total_change_amount\n",
     "\n",
     "print(f\"\\nGeneral Fund Impact:\")\n",
-    "print(f\"  RFA Estimate:         ${rfa_total_impact:>15,.0f}\")\n",
+    "print(f\"  RFA Estimate:          ${rfa_total_impact:>15,.0f}\")\n",
     "print(f\"  PolicyEngine Estimate: ${pe_total_impact:>15,.0f}\")\n",
-    "print(f\"  Difference:           ${pe_total_impact - rfa_total_impact:>15,.0f}\")\n",
+    "print(f\"  Difference:            ${pe_total_impact - rfa_total_impact:>15,.0f}\")\n",
     "\n",
     "# Calculate accuracy\n",
     "accuracy = 1 - abs(pe_total_impact - rfa_total_impact) / abs(rfa_total_impact)\n",
     "print(f\"\\n  Accuracy vs RFA: {accuracy*100:.1f}%\")\n",
     "\n",
     "# Return count comparison\n",
-    "rfa_total_returns = rfa_df['Est. # of Returns'].sum()\n",
+    "rfa_total_returns = rfa_df['Est # Returns'].sum()\n",
     "print(f\"\\nTotal Returns:\")\n",
     "print(f\"  RFA:          {rfa_total_returns:>12,.0f}\")\n",
     "print(f\"  PolicyEngine: {int(total_returns):>12,.0f}\")\n",
@@ -563,9 +725,35 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 15,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "================================================================================\n",
+      "IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\n",
+      "================================================================================\n",
+      "             AGI Range  PE Returns  RFA Returns  PE Impact  RFA Impact     Diff ($)\n",
+      "                   $0*       58352        78854          0   -571000.0     571000.0\n",
+      "         $1 to $10,000      168000            0          0         0.0          0.0\n",
+      "    $10,001 to $20,000      205689            0     697809         0.0     697809.0\n",
+      "    $20,001 to $30,000      226431            0    2860578         0.0    2860578.0\n",
+      "    $30,001 to $40,000      174753            0   -4382816         0.0   -4382816.0\n",
+      "    $40,001 to $50,000      155837            0  -11700509         0.0  -11700509.0\n",
+      "    $50,001 to $75,000      262861            0  -27688580         0.0  -27688580.0\n",
+      "   $75,001 to $100,000      215040            0  -38227128         0.0  -38227128.0\n",
+      "  $100,001 to $150,000      278127            0   56022196         0.0   56022196.0\n",
+      "  $150,001 to $200,000       49870            0   34402136         0.0   34402136.0\n",
+      "  $200,001 to $300,000       40779            0   22764908         0.0   22764908.0\n",
+      "  $300,001 to $500,000       42814            0  -20835856         0.0  -20835856.0\n",
+      "$500,001 to $1,000,000       13719            0   -7850124         0.0   -7850124.0\n",
+      "       Over $1,000,000       12909            0 -117005352         0.0 -117005352.0\n"
+     ]
+    }
+   ],
    "source": [
     "# Side-by-side comparison by income bracket\n",
     "print(\"\\n\" + \"=\"*80)\n",
@@ -581,8 +769,8 @@
     "    # Find matching RFA row\n",
     "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == row['Federal AGI Range']]\n",
     "    if len(rfa_match) > 0:\n",
-    "        rfa_impact = rfa_match['Total Change'].values[0]\n",
-    "        rfa_returns = rfa_match['Est. # of Returns'].values[0]\n",
+    "        rfa_impact = rfa_match['Total Dollar Change Numeric'].values[0]\n",
+    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
     "    else:\n",
     "        rfa_impact = 0\n",
     "        rfa_returns = 0\n",
@@ -622,4 +810,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
\ No newline at end of file
+}
diff --git a/us/states/sc/sc_h4216_tax_impact_analysis.csv b/us/states/sc/sc_h4216_tax_impact_analysis.csv
index d9347c6..79ed7e3 100644
--- a/us/states/sc/sc_h4216_tax_impact_analysis.csv
+++ b/us/states/sc/sc_h4216_tax_impact_analysis.csv
@@ -1,16 +1,16 @@
-AGI Range,Est Returns,% Returns,Old Avg Tax,New Avg Tax,Total Change,Decrease %,Increase %,No Change %
-$0*,"619,009",21.1%,$0,$0,$0,0.0%,0.0%,100.0%
-"$1 to $10,000","502,276",17.1%,$0,$0,$0,0.0%,0.0%,100.0%
-"$10,001 to $20,000","279,412",9.5%,$0,$10,"$2,686,016",0.0%,19.3%,80.7%
-"$20,001 to $30,000","252,862",8.6%,$64,$102,"$9,483,900",2.0%,51.8%,46.2%
-"$30,001 to $40,000","215,980",7.4%,$225,$202,"$-5,113,025",40.9%,22.0%,37.0%
-"$40,001 to $50,000","197,525",6.7%,$547,$412,"$-26,503,160",50.6%,27.0%,22.3%
-"$50,001 to $75,000","300,857",10.2%,$822,$745,"$-23,279,076",53.3%,31.6%,15.1%
-"$75,001 to $100,000","177,284",6.0%,"$1,781","$1,710","$-12,547,614",64.0%,31.0%,5.1%
-"$100,001 to $150,000","187,945",6.4%,"$3,292","$3,576","$53,395,056",36.3%,63.1%,0.6%
-"$150,001 to $200,000","73,396",2.5%,"$6,049","$6,776","$53,332,632",6.2%,93.8%,0.0%
-"$200,001 to $300,000","52,882",1.8%,"$9,164","$10,004","$44,394,276",6.0%,93.9%,0.1%
-"$300,001 to $500,000","36,977",1.3%,"$17,163","$18,262","$40,630,812",29.4%,70.6%,0.0%
-"$500,001 to $1,000,000","16,525",0.6%,"$26,140","$27,269","$18,658,860",71.0%,29.0%,0.0%
-"Over $1,000,000","22,686",0.8%,"$139,623","$134,541","$-115,293,904",95.5%,4.5%,0.0%
-Total,"2,935,621",100.0%,"$2,220","$2,234","$39,844,772",20.0%,24.0%,56.0%
+Federal AGI Range,Est. # Returns,% of Returns,Old Avg Tax,New Avg Tax,Returns w/ Change,% w/ Change,Avg Change,Total Change ($),Decrease #,Decrease %,Total Decrease ($),Avg Decrease,Increase #,Increase %,Total Increase ($),Avg Increase,No Change #,No Change %,Zero Tax #,Zero Tax %
+$0*,58352,3.0999999046325684,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,58352,100.0,58352,100.0
+"$1 to $10,000",168000,8.800000190734863,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,168000,100.0,168000,100.0
+"$10,001 to $20,000",205689,10.800000190734863,0,3,12906,6.3,54,697809,0,0.0,0,0,12906,6.3,697809,54,192783,93.7,192783,93.7
+"$20,001 to $30,000",226431,11.899999618530273,33,45,52834,23.3,54,2860578,1427,0.6,-8402,-6,51406,22.7,2871184,56,173597,76.7,171348,75.7
+"$30,001 to $40,000",174753,9.199999809265137,182,156,80105,45.8,-55,-4382816,57708,33.0,-5940918,-103,22397,12.8,1558448,70,94648,54.2,94228,53.9
+"$40,001 to $50,000",155837,8.199999809265137,319,244,92790,59.5,-126,-11700509,48322,31.0,-15560643,-322,44468,28.5,3860133,87,63047,40.5,63047,40.5
+"$50,001 to $75,000",262861,13.800000190734863,581,475,214098,81.4,-129,-27688580,136898,52.1,-37521040,-274,77200,29.4,9832463,127,48763,18.6,48850,18.6
+"$75,001 to $100,000",215040,11.300000190734863,1338,1161,189218,88.0,-202,-38227128,138525,64.4,-52849696,-382,50694,23.6,14622566,288,25821,12.0,26375,12.3
+"$100,001 to $150,000",278127,14.600000381469727,2928,3130,274640,98.7,204,56022196,118122,42.5,-19568998,-166,156517,56.3,75591424,483,3487,1.3,2748,1.0
+"$150,001 to $200,000",49870,2.5999999046325684,5124,5814,49870,100.0,690,34402136,1551,3.1,-380708,-246,48319,96.9,34782844,720,0,0.0,0,0.0
+"$200,001 to $300,000",40779,2.0999999046325684,9149,9707,40720,99.9,559,22764908,2048,5.0,-201820,-99,38672,94.8,22966736,594,59,0.1,0,0.0
+"$300,001 to $500,000",42814,2.200000047683716,17785,17299,42018,98.1,-496,-20835856,35387,82.7,-24901672,-704,6631,15.5,4065817,613,796,1.9,796,1.9
+"$500,001 to $1,000,000",13719,0.699999988079071,27237,26665,13719,100.0,-572,-7850124,13076,95.3,-19588270,-1498,643,4.7,11738147,18254,0,0.0,0,0.0
+"Over $1,000,000",12909,0.699999988079071,113354,104291,12909,100.0,-9064,-117005352,12703,98.4,-128537088,-10118,206,1.6,11531744,56085,0,0.0,0,0.0
+Total,1905181,100.0,2399,2341,1075827,56.5,-58,-110942720,565768,29.7,-305059264,-539,510059,26.8,194119312,381,829354,43.5,826527,43.4
diff --git a/us/states/sc/sc_staging_dataset_summary_weighted.csv b/us/states/sc/sc_staging_dataset_summary_weighted.csv
new file mode 100644
index 0000000..0916e13
--- /dev/null
+++ b/us/states/sc/sc_staging_dataset_summary_weighted.csv
@@ -0,0 +1,22 @@
+Metric,Value
+Household count (weighted),"1,573,988"
+Person count (weighted),"4,782,288"
+Average household size,3.0
+Weighted median household AGI,"$60,027"
+Weighted average household AGI,"$101,637"
+Weighted median person AGI,"$56,467"
+Weighted average person AGI,"$97,281"
+Unweighted median household AGI,"$70,402"
+Unweighted median person AGI,"$69,786"
+25th percentile household AGI,"$25,465"
+75th percentile household AGI,"$108,580"
+90th percentile household AGI,"$162,966"
+95th percentile household AGI,"$262,984"
+Max household AGI,"$331,162,720"
+Total households with children,"672,174"
+Households with 1 child,"330,715"
+Households with 2 children,"222,793"
+Households with 3+ children,"118,666"
+Total children under 18,"1,161,666"
+Children under 6,"345,596"
+Children under 3,"164,319"

From 38c8b2c4c223ff393b9804281cf89b849e052908 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Mon, 2 Mar 2026 14:07:10 -0500
Subject: [PATCH 08/12] update

---
 us/states/sc/data_exploration_staging.ipynb   | 128 ++++++++++--------
 .../sc_staging_dataset_summary_weighted.csv   |  40 +++---
 2 files changed, 95 insertions(+), 73 deletions(-)

diff --git a/us/states/sc/data_exploration_staging.ipynb b/us/states/sc/data_exploration_staging.ipynb
index c749cbd..b797ac0 100644
--- a/us/states/sc/data_exploration_staging.ipynb
+++ b/us/states/sc/data_exploration_staging.ipynb
@@ -29,7 +29,29 @@
    "execution_count": 2,
    "id": "cell-2",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "2eb0b3ac0b824f52a3a6066931afc5ac",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "SC.h5:   0%|          | 0.00/38.1M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    }
+   ],
    "source": [
     "# Load SC staging dataset\n",
     "sim = Microsimulation(dataset=SC_DATASET)"
@@ -45,9 +67,9 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Number of households in dataset: 25,104\n",
-      "Household count (weighted): 1,573,988\n",
-      "Person count (weighted): 4,782,288\n"
+      "Number of households in dataset: 22,528\n",
+      "Household count (weighted): 1,587,912\n",
+      "Person count (weighted): 4,788,894\n"
      ]
     }
    ],
@@ -77,24 +99,24 @@
       "============================================================\n",
       "\n",
       "Household AGI:\n",
-      "  Unweighted median: $70,402\n",
-      "  Weighted median:   $60,027\n",
-      "  Weighted average:  $101,637\n",
+      "  Unweighted median: $67,907\n",
+      "  Weighted median:   $60,378\n",
+      "  Weighted average:  $105,617\n",
       "\n",
       "Person AGI:\n",
-      "  Unweighted median: $69,786\n",
-      "  Weighted median:   $56,467\n",
-      "  Weighted average:  $97,281\n",
+      "  Unweighted median: $67,460\n",
+      "  Weighted median:   $56,366\n",
+      "  Weighted average:  $100,583\n",
       "\n",
       "Average household size: 3.0\n",
       "\n",
       "Weighted household AGI percentiles:\n",
-      "  25th percentile: $25,465\n",
-      "  50th percentile: $60,027\n",
-      "  75th percentile: $108,580\n",
-      "  90th percentile: $162,966\n",
-      "  95th percentile: $262,984\n",
-      "  Max AGI: $331,162,720\n"
+      "  25th percentile: $27,117\n",
+      "  50th percentile: $60,378\n",
+      "  75th percentile: $105,515\n",
+      "  90th percentile: $153,279\n",
+      "  95th percentile: $237,856\n",
+      "  Max AGI: $353,653,602\n"
      ]
     }
    ],
@@ -170,10 +192,10 @@
      "text": [
       "\n",
       "Households with children (weighted):\n",
-      "  Total households with children: 672,174\n",
-      "  Households with 1 child: 330,715\n",
-      "  Households with 2 children: 222,793\n",
-      "  Households with 3+ children: 118,666\n"
+      "  Total households with children: 637,558\n",
+      "  Households with 1 child: 308,153\n",
+      "  Households with 2 children: 190,106\n",
+      "  Households with 3+ children: 139,299\n"
      ]
     }
    ],
@@ -221,9 +243,9 @@
      "text": [
       "\n",
       "Children by age:\n",
-      "  Total children under 18: 1,161,666\n",
-      "  Children under 6: 345,596\n",
-      "  Children under 3: 164,319\n"
+      "  Total children under 18: 1,157,115\n",
+      "  Children under 6: 350,517\n",
+      "  Children under 3: 177,575\n"
      ]
     }
    ],
@@ -268,27 +290,27 @@
       "SC STAGING DATASET SUMMARY - WEIGHTED (Population Estimates)\n",
       "=================================================================\n",
       "                         Metric        Value\n",
-      "     Household count (weighted)    1,573,988\n",
-      "        Person count (weighted)    4,782,288\n",
+      "     Household count (weighted)    1,587,912\n",
+      "        Person count (weighted)    4,788,894\n",
       "         Average household size          3.0\n",
-      "  Weighted median household AGI      $60,027\n",
-      " Weighted average household AGI     $101,637\n",
-      "     Weighted median person AGI      $56,467\n",
-      "    Weighted average person AGI      $97,281\n",
-      "Unweighted median household AGI      $70,402\n",
-      "   Unweighted median person AGI      $69,786\n",
-      "  25th percentile household AGI      $25,465\n",
-      "  75th percentile household AGI     $108,580\n",
-      "  90th percentile household AGI     $162,966\n",
-      "  95th percentile household AGI     $262,984\n",
-      "              Max household AGI $331,162,720\n",
-      " Total households with children      672,174\n",
-      "        Households with 1 child      330,715\n",
-      "     Households with 2 children      222,793\n",
-      "    Households with 3+ children      118,666\n",
-      "        Total children under 18    1,161,666\n",
-      "               Children under 6      345,596\n",
-      "               Children under 3      164,319\n",
+      "  Weighted median household AGI      $60,378\n",
+      " Weighted average household AGI     $105,617\n",
+      "     Weighted median person AGI      $56,366\n",
+      "    Weighted average person AGI     $100,583\n",
+      "Unweighted median household AGI      $67,907\n",
+      "   Unweighted median person AGI      $67,460\n",
+      "  25th percentile household AGI      $27,117\n",
+      "  75th percentile household AGI     $105,515\n",
+      "  90th percentile household AGI     $153,279\n",
+      "  95th percentile household AGI     $237,856\n",
+      "              Max household AGI $353,653,602\n",
+      " Total households with children      637,558\n",
+      "        Households with 1 child      308,153\n",
+      "     Households with 2 children      190,106\n",
+      "    Households with 3+ children      139,299\n",
+      "        Total children under 18    1,157,115\n",
+      "               Children under 6      350,517\n",
+      "               Children under 3      177,575\n",
       "=================================================================\n",
       "\n",
       "Summary saved to: sc_staging_dataset_summary_weighted.csv\n"
@@ -373,8 +395,8 @@
       "======================================================================\n",
       "HOUSEHOLDS WITH $0 INCOME\n",
       "======================================================================\n",
-      "Household count: 11,880\n",
-      "Percentage of all households: 0.75%\n",
+      "Household count: 9,513\n",
+      "Percentage of all households: 0.60%\n",
       "======================================================================\n"
      ]
     }
@@ -411,16 +433,16 @@
       "HOUSEHOLD COUNTS BY INCOME BRACKET\n",
       "======================================================================\n",
       "Income Bracket Households % of All Households\n",
-      "       $0-$10k    120,600               7.66%\n",
-      "     $10k-$20k    161,829              10.28%\n",
-      "     $20k-$30k    169,710              10.78%\n",
-      "     $30k-$40k    116,353               7.39%\n",
-      "     $40k-$50k    115,397               7.33%\n",
-      "     $50k-$60k     95,344               6.06%\n",
+      "       $0-$10k    136,673               8.61%\n",
+      "     $10k-$20k    154,618               9.74%\n",
+      "     $20k-$30k    148,652               9.36%\n",
+      "     $30k-$40k    125,157               7.88%\n",
+      "     $40k-$50k    121,742               7.67%\n",
+      "     $50k-$60k    101,082               6.37%\n",
       "======================================================================\n",
       "\n",
-      "Total households in $0-$60k range: 779,233\n",
-      "Percentage of all households in $0-$60k range: 49.51%\n"
+      "Total households in $0-$60k range: 787,925\n",
+      "Percentage of all households in $0-$60k range: 49.62%\n"
      ]
     }
    ],
diff --git a/us/states/sc/sc_staging_dataset_summary_weighted.csv b/us/states/sc/sc_staging_dataset_summary_weighted.csv
index 0916e13..e7ac8fa 100644
--- a/us/states/sc/sc_staging_dataset_summary_weighted.csv
+++ b/us/states/sc/sc_staging_dataset_summary_weighted.csv
@@ -1,22 +1,22 @@
 Metric,Value
-Household count (weighted),"1,573,988"
-Person count (weighted),"4,782,288"
+Household count (weighted),"1,587,912"
+Person count (weighted),"4,788,894"
 Average household size,3.0
-Weighted median household AGI,"$60,027"
-Weighted average household AGI,"$101,637"
-Weighted median person AGI,"$56,467"
-Weighted average person AGI,"$97,281"
-Unweighted median household AGI,"$70,402"
-Unweighted median person AGI,"$69,786"
-25th percentile household AGI,"$25,465"
-75th percentile household AGI,"$108,580"
-90th percentile household AGI,"$162,966"
-95th percentile household AGI,"$262,984"
-Max household AGI,"$331,162,720"
-Total households with children,"672,174"
-Households with 1 child,"330,715"
-Households with 2 children,"222,793"
-Households with 3+ children,"118,666"
-Total children under 18,"1,161,666"
-Children under 6,"345,596"
-Children under 3,"164,319"
+Weighted median household AGI,"$60,378"
+Weighted average household AGI,"$105,617"
+Weighted median person AGI,"$56,366"
+Weighted average person AGI,"$100,583"
+Unweighted median household AGI,"$67,907"
+Unweighted median person AGI,"$67,460"
+25th percentile household AGI,"$27,117"
+75th percentile household AGI,"$105,515"
+90th percentile household AGI,"$153,279"
+95th percentile household AGI,"$237,856"
+Max household AGI,"$353,653,602"
+Total households with children,"637,558"
+Households with 1 child,"308,153"
+Households with 2 children,"190,106"
+Households with 3+ children,"139,299"
+Total children under 18,"1,157,115"
+Children under 6,"350,517"
+Children under 3,"177,575"

From 9d7bd1ba69433e050fa915e0c9fb43dc22695ee0 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Fri, 6 Mar 2026 12:32:19 -0500
Subject: [PATCH 09/12] Clean up SC analysis: remove staging, add test dataset
 exploration

- Remove staging dataset files (broken data)
- Add data_exploration_test.ipynb for test dataset (hf://policyengine/test/mar/SC.h5)
- Update all notebooks to use .values for raw arrays (avoid double-weighting)
- Update sc_h4216_budget_impact.py to use test dataset and correct RFA estimate
- Update sc_h4216_reform_analysis.ipynb to use test dataset
- Add sc_h4216_dataset_comparison.py comparing production vs test datasets

RFA estimates:
- 5.21% rate: -$309M
- 5.39% rate: -$119.1M

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/data_exploration.ipynb           | 155 +---------
 ...ging.ipynb => data_exploration_test.ipynb} | 276 ++++--------------
 us/states/sc/sc_h4216_budget_impact.py        |   8 +-
 us/states/sc/sc_h4216_dataset_comparison.py   |  92 ++++++
 us/states/sc/sc_h4216_reform_analysis.ipynb   | 234 ++++++++-------
 us/states/sc/sc_h4216_tax_impact_analysis.csv |  30 +-
 .../sc_staging_dataset_summary_weighted.csv   |  22 --
 7 files changed, 307 insertions(+), 510 deletions(-)
 rename us/states/sc/{data_exploration_staging.ipynb => data_exploration_test.ipynb} (57%)
 create mode 100644 us/states/sc/sc_h4216_dataset_comparison.py
 delete mode 100644 us/states/sc/sc_staging_dataset_summary_weighted.csv

diff --git a/us/states/sc/data_exploration.ipynb b/us/states/sc/data_exploration.ipynb
index 09787fd..b4ba407 100644
--- a/us/states/sc/data_exploration.ipynb
+++ b/us/states/sc/data_exploration.ipynb
@@ -34,172 +34,45 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Number of households in dataset: 35,324\n",
-      "Household count (weighted): 1,887,388\n",
-      "Person count (weighted): 5,451,832\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Check dataset size\n",
-    "household_weight = sim.calculate(\"household_weight\", period=2025)\n",
-    "household_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\")\n",
-    "person_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\")\n",
-    "\n",
-    "print(f\"Number of households in dataset: {len(household_weight):,}\")\n",
-    "print(f\"Household count (weighted): {household_count.sum():,.0f}\")\n",
-    "print(f\"Person count (weighted): {person_count.sum():,.0f}\")"
-   ]
+   "outputs": [],
+   "source": "# Check dataset size - use .values to get raw arrays (avoid MicroSeries auto-weighting)\nhousehold_weight = sim.calculate(\"household_weight\", period=2025).values\nhousehold_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\").values\nperson_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\").values\n\n# Weighted sums using raw arrays\nweighted_household_count = (household_count * household_weight).sum()\nweighted_person_count = (person_count * household_weight).sum()\n\nprint(f\"Number of households in dataset: {len(household_weight):,}\")\nprint(f\"Household count (weighted): {weighted_household_count:,.0f}\")\nprint(f\"Person count (weighted): {weighted_person_count:,.0f}\")"
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": "# Check income distribution (weighted vs unweighted, household and person level)\nagi_household = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\")\nagi_hh_array = np.array(agi_household)\nhh_weights = np.array(sim.calculate(\"household_weight\", period=2025))\n\nagi_person = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\")\nagi_person_array = np.array(agi_person)\nperson_weights = np.array(sim.calculate(\"person_weight\", period=2025))\n\n# Weighted percentile calculation\ndef weighted_percentile(values, weights, percentile):\n    sorted_indices = np.argsort(values)\n    sorted_values = values[sorted_indices]\n    sorted_weights = weights[sorted_indices]\n    cumulative_weight = np.cumsum(sorted_weights)\n    idx = np.searchsorted(cumulative_weight, cumulative_weight[-1] * percentile / 100)\n    return sorted_values[min(idx, len(sorted_values)-1)]\n\n# Unweighted medians\nunweighted_median_hh = np.median(agi_hh_array)\nunweighted_median_person = np.median(agi_person_array)\n\n# Weighted medians\nweighted_median_hh = weighted_percentile(agi_hh_array, hh_weights, 50)\nweighted_median_person = weighted_percentile(agi_person_array, person_weights, 50)\n\n# Weighted averages\nweighted_avg_hh = np.average(agi_hh_array, weights=hh_weights)\nweighted_avg_person = np.average(agi_person_array, weights=person_weights)\n\n# Average household size\ntotal_persons = person_weights.sum()\ntotal_households = hh_weights.sum()\navg_hh_size = total_persons / total_households\n\nprint(\"=\" * 60)\nprint(\"INCOME DISTRIBUTION SUMMARY\")\nprint(\"=\" * 60)\nprint(f\"\\nHousehold AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_hh:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_hh:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_hh:,.0f}\")\n\nprint(f\"\\nPerson AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_person:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_person:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_person:,.0f}\")\n\nprint(f\"\\nAverage household size: {avg_hh_size:.1f}\")\n\nprint(f\"\\nWeighted household AGI percentiles:\")\nprint(f\"  25th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\")\nprint(f\"  50th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 50):,.0f}\")\nprint(f\"  75th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\")\nprint(f\"  90th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\")\nprint(f\"  95th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\")\nprint(f\"  Max AGI: ${agi_hh_array.max():,.0f}\")"
+   "source": "# Check income distribution (weighted vs unweighted, household and person level)\n# Use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)\nagi_hh_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\nhh_weights = sim.calculate(\"household_weight\", period=2025).values\n\nagi_person_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\").values\nperson_weights = sim.calculate(\"person_weight\", period=2025).values\n\n# Weighted percentile calculation\ndef weighted_percentile(values, weights, percentile):\n    sorted_indices = np.argsort(values)\n    sorted_values = values[sorted_indices]\n    sorted_weights = weights[sorted_indices]\n    cumulative_weight = np.cumsum(sorted_weights)\n    idx = np.searchsorted(cumulative_weight, cumulative_weight[-1] * percentile / 100)\n    return sorted_values[min(idx, len(sorted_values)-1)]\n\n# Unweighted medians\nunweighted_median_hh = np.median(agi_hh_array)\nunweighted_median_person = np.median(agi_person_array)\n\n# Weighted medians\nweighted_median_hh = weighted_percentile(agi_hh_array, hh_weights, 50)\nweighted_median_person = weighted_percentile(agi_person_array, person_weights, 50)\n\n# Weighted averages\nweighted_avg_hh = np.average(agi_hh_array, weights=hh_weights)\nweighted_avg_person = np.average(agi_person_array, weights=person_weights)\n\n# Average household size\ntotal_persons = person_weights.sum()\ntotal_households = hh_weights.sum()\navg_hh_size = total_persons / total_households\n\nprint(\"=\" * 60)\nprint(\"INCOME DISTRIBUTION SUMMARY\")\nprint(\"=\" * 60)\nprint(f\"\\nHousehold AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_hh:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_hh:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_hh:,.0f}\")\n\nprint(f\"\\nPerson AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_person:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_person:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_person:,.0f}\")\n\nprint(f\"\\nAverage household size: {avg_hh_size:.1f}\")\n\nprint(f\"\\nWeighted household AGI percentiles:\")\nprint(f\"  25th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\")\nprint(f\"  50th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 50):,.0f}\")\nprint(f\"  75th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\")\nprint(f\"  90th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\")\nprint(f\"  95th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\")\nprint(f\"  Max AGI: ${agi_hh_array.max():,.0f}\")"
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Households with children (weighted):\n",
-      "  Total households with children: 598,564\n",
-      "  Households with 1 child: 247,956\n",
-      "  Households with 2 children: 190,545\n",
-      "  Households with 3+ children: 160,063\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Check households with children\n",
-    "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\")\n",
-    "household_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\")\n",
-    "household_weight = sim.calculate(\"household_weight\", period=2025, map_to=\"person\")\n",
-    "\n",
-    "# Create DataFrame\n",
-    "df_households = pd.DataFrame({\n",
-    "    'household_id': household_id,\n",
-    "    'is_child': is_child,\n",
-    "    'household_weight': household_weight\n",
-    "})\n",
-    "\n",
-    "# Count children per household\n",
-    "children_per_household = df_households.groupby('household_id').agg({\n",
-    "    'is_child': 'sum',\n",
-    "    'household_weight': 'first'\n",
-    "}).reset_index()\n",
-    "\n",
-    "# Calculate weighted household counts\n",
-    "total_households_with_children = children_per_household[children_per_household['is_child'] > 0]['household_weight'].sum()\n",
-    "households_with_1_child = children_per_household[children_per_household['is_child'] == 1]['household_weight'].sum()\n",
-    "households_with_2_children = children_per_household[children_per_household['is_child'] == 2]['household_weight'].sum()\n",
-    "households_with_3plus_children = children_per_household[children_per_household['is_child'] >= 3]['household_weight'].sum()\n",
-    "\n",
-    "print(f\"\\nHouseholds with children (weighted):\")\n",
-    "print(f\"  Total households with children: {total_households_with_children:,.0f}\")\n",
-    "print(f\"  Households with 1 child: {households_with_1_child:,.0f}\")\n",
-    "print(f\"  Households with 2 children: {households_with_2_children:,.0f}\")\n",
-    "print(f\"  Households with 3+ children: {households_with_3plus_children:,.0f}\")"
-   ]
+   "outputs": [],
+   "source": "# Check households with children - use .values for raw arrays\nis_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\").values\nhousehold_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\").values\nhousehold_weight_person = sim.calculate(\"household_weight\", period=2025, map_to=\"person\").values\n\n# Create DataFrame\ndf_households = pd.DataFrame({\n    'household_id': household_id,\n    'is_child': is_child,\n    'household_weight': household_weight_person\n})\n\n# Count children per household\nchildren_per_household = df_households.groupby('household_id').agg({\n    'is_child': 'sum',\n    'household_weight': 'first'\n}).reset_index()\n\n# Calculate weighted household counts\ntotal_households_with_children = children_per_household[children_per_household['is_child'] > 0]['household_weight'].sum()\nhouseholds_with_1_child = children_per_household[children_per_household['is_child'] == 1]['household_weight'].sum()\nhouseholds_with_2_children = children_per_household[children_per_household['is_child'] == 2]['household_weight'].sum()\nhouseholds_with_3plus_children = children_per_household[children_per_household['is_child'] >= 3]['household_weight'].sum()\n\nprint(f\"\\nHouseholds with children (weighted):\")\nprint(f\"  Total households with children: {total_households_with_children:,.0f}\")\nprint(f\"  Households with 1 child: {households_with_1_child:,.0f}\")\nprint(f\"  Households with 2 children: {households_with_2_children:,.0f}\")\nprint(f\"  Households with 3+ children: {households_with_3plus_children:,.0f}\")"
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Children by age:\n",
-      "  Total children under 18: 1,198,147\n",
-      "  Children under 6: 349,101\n",
-      "  Children under 3: 169,412\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Check children by age groups\n",
-    "df = pd.DataFrame({\n",
-    "    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\"),\n",
-    "    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\"),\n",
-    "    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\"),\n",
-    "    \"age\": sim.calculate(\"age\", map_to=\"person\"),\n",
-    "    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\")\n",
-    "})\n",
-    "\n",
-    "# Filter for children and apply weights\n",
-    "children_under_18_df = df[df['age'] < 18]\n",
-    "children_under_6_df = df[df['age'] < 6]\n",
-    "children_under_3_df = df[df['age'] < 3]\n",
-    "\n",
-    "# Calculate weighted totals\n",
-    "total_children = children_under_18_df['person_weight'].sum()\n",
-    "children_under_6 = children_under_6_df['person_weight'].sum()\n",
-    "children_under_3 = children_under_3_df['person_weight'].sum()\n",
-    "\n",
-    "print(f\"\\nChildren by age:\")\n",
-    "print(f\"  Total children under 18: {total_children:,.0f}\")\n",
-    "print(f\"  Children under 6: {children_under_6:,.0f}\")\n",
-    "print(f\"  Children under 3: {children_under_3:,.0f}\")"
-   ]
+   "outputs": [],
+   "source": "# Check children by age groups - use .values for raw arrays\ndf = pd.DataFrame({\n    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\").values,\n    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\").values,\n    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\").values,\n    \"age\": sim.calculate(\"age\", map_to=\"person\").values,\n    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\").values\n})\n\n# Filter for children and apply weights\nchildren_under_18_df = df[df['age'] < 18]\nchildren_under_6_df = df[df['age'] < 6]\nchildren_under_3_df = df[df['age'] < 3]\n\n# Calculate weighted totals\ntotal_children = children_under_18_df['person_weight'].sum()\nchildren_under_6 = children_under_6_df['person_weight'].sum()\nchildren_under_3 = children_under_3_df['person_weight'].sum()\n\nprint(f\"\\nChildren by age:\")\nprint(f\"  Total children under 18: {total_children:,.0f}\")\nprint(f\"  Children under 6: {children_under_6:,.0f}\")\nprint(f\"  Children under 3: {children_under_3:,.0f}\")"
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": "# Create comprehensive summary table\nsummary_data = {\n    'Metric': [\n        'Household count (weighted)',\n        'Person count (weighted)',\n        'Average household size',\n        'Weighted median household AGI',\n        'Weighted average household AGI',\n        'Weighted median person AGI',\n        'Weighted average person AGI',\n        'Unweighted median household AGI',\n        'Unweighted median person AGI',\n        '25th percentile household AGI',\n        '75th percentile household AGI',\n        '90th percentile household AGI',\n        '95th percentile household AGI',\n        'Max household AGI',\n        'Total households with children',\n        'Households with 1 child',\n        'Households with 2 children',\n        'Households with 3+ children',\n        'Total children under 18',\n        'Children under 6',\n        'Children under 3'\n    ],\n    'Value': [\n        f\"{household_count.sum():,.0f}\",\n        f\"{person_count.sum():,.0f}\",\n        f\"{avg_hh_size:.1f}\",\n        f\"${weighted_median_hh:,.0f}\",\n        f\"${weighted_avg_hh:,.0f}\",\n        f\"${weighted_median_person:,.0f}\",\n        f\"${weighted_avg_person:,.0f}\",\n        f\"${unweighted_median_hh:,.0f}\",\n        f\"${unweighted_median_person:,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\",\n        f\"${agi_hh_array.max():,.0f}\",\n        f\"{total_households_with_children:,.0f}\",\n        f\"{households_with_1_child:,.0f}\",\n        f\"{households_with_2_children:,.0f}\",\n        f\"{households_with_3plus_children:,.0f}\",\n        f\"{total_children:,.0f}\",\n        f\"{children_under_6:,.0f}\",\n        f\"{children_under_3:,.0f}\"\n    ]\n}\n\nsummary_df = pd.DataFrame(summary_data)\n\nprint(\"\\n\" + \"=\"*65)\nprint(\"SC DATASET SUMMARY - WEIGHTED (Population Estimates)\")\nprint(\"=\"*65)\nprint(summary_df.to_string(index=False))\nprint(\"=\"*65)\n\n# Save table\nsummary_df.to_csv('sc_dataset_summary_weighted.csv', index=False)\nprint(\"\\nSummary saved to: sc_dataset_summary_weighted.csv\")"
+   "source": "# Create comprehensive summary table\nsummary_data = {\n    'Metric': [\n        'Household count (weighted)',\n        'Person count (weighted)',\n        'Average household size',\n        'Weighted median household AGI',\n        'Weighted average household AGI',\n        'Weighted median person AGI',\n        'Weighted average person AGI',\n        'Unweighted median household AGI',\n        'Unweighted median person AGI',\n        '25th percentile household AGI',\n        '75th percentile household AGI',\n        '90th percentile household AGI',\n        '95th percentile household AGI',\n        'Max household AGI',\n        'Total households with children',\n        'Households with 1 child',\n        'Households with 2 children',\n        'Households with 3+ children',\n        'Total children under 18',\n        'Children under 6',\n        'Children under 3'\n    ],\n    'Value': [\n        f\"{weighted_household_count:,.0f}\",\n        f\"{weighted_person_count:,.0f}\",\n        f\"{avg_hh_size:.1f}\",\n        f\"${weighted_median_hh:,.0f}\",\n        f\"${weighted_avg_hh:,.0f}\",\n        f\"${weighted_median_person:,.0f}\",\n        f\"${weighted_avg_person:,.0f}\",\n        f\"${unweighted_median_hh:,.0f}\",\n        f\"${unweighted_median_person:,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\",\n        f\"${agi_hh_array.max():,.0f}\",\n        f\"{total_households_with_children:,.0f}\",\n        f\"{households_with_1_child:,.0f}\",\n        f\"{households_with_2_children:,.0f}\",\n        f\"{households_with_3plus_children:,.0f}\",\n        f\"{total_children:,.0f}\",\n        f\"{children_under_6:,.0f}\",\n        f\"{children_under_3:,.0f}\"\n    ]\n}\n\nsummary_df = pd.DataFrame(summary_data)\n\nprint(\"\\n\" + \"=\"*65)\nprint(\"SC DATASET SUMMARY - WEIGHTED (Population Estimates)\")\nprint(\"=\"*65)\nprint(summary_df.to_string(index=False))\nprint(\"=\"*65)\n\n# Save table\nsummary_df.to_csv('sc_dataset_summary_weighted.csv', index=False)\nprint(\"\\nSummary saved to: sc_dataset_summary_weighted.csv\")"
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": null,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "======================================================================\n",
-      "HOUSEHOLDS WITH $0 INCOME\n",
-      "======================================================================\n",
-      "Household count: 179,119\n",
-      "Percentage of all households: 9.49%\n",
-      "======================================================================\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Households with $0 income\n",
-    "agi_hh = np.array(sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\"))\n",
-    "weights = np.array(sim.calculate(\"household_weight\", period=2025))\n",
-    "\n",
-    "zero_income_mask = agi_hh == 0\n",
-    "zero_income_count = weights[zero_income_mask].sum()\n",
-    "total_households = weights.sum()\n",
-    "\n",
-    "print(\"\\n\" + \"=\"*70)\n",
-    "print(\"HOUSEHOLDS WITH $0 INCOME\")\n",
-    "print(\"=\"*70)\n",
-    "print(f\"Household count: {zero_income_count:,.0f}\")\n",
-    "print(f\"Percentage of all households: {zero_income_count / total_households * 100:.2f}%\")\n",
-    "print(\"=\"*70)"
-   ]
+   "outputs": [],
+   "source": "# Households with $0 income - using raw arrays\nagi_hh = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\nweights = sim.calculate(\"household_weight\", period=2025).values\n\nzero_income_mask = agi_hh == 0\nzero_income_count = weights[zero_income_mask].sum()\ntotal_households = weights.sum()\n\nprint(\"\\n\" + \"=\"*70)\nprint(\"HOUSEHOLDS WITH $0 INCOME\")\nprint(\"=\"*70)\nprint(f\"Household count: {zero_income_count:,.0f}\")\nprint(f\"Percentage of all households: {zero_income_count / total_households * 100:.2f}%\")\nprint(\"=\"*70)"
   },
   {
    "cell_type": "code",
diff --git a/us/states/sc/data_exploration_staging.ipynb b/us/states/sc/data_exploration_test.ipynb
similarity index 57%
rename from us/states/sc/data_exploration_staging.ipynb
rename to us/states/sc/data_exploration_test.ipynb
index b797ac0..938545d 100644
--- a/us/states/sc/data_exploration_staging.ipynb
+++ b/us/states/sc/data_exploration_test.ipynb
@@ -5,14 +5,14 @@
    "id": "cell-0",
    "metadata": {},
    "source": [
-    "# SC Dataset Exploration (Staging)\n",
+    "# SC Dataset Exploration (Test - March 2025)\n",
     "\n",
-    "This notebook explores the South Carolina (SC) **staging** dataset to understand household counts, income distribution, and demographic characteristics."
+    "This notebook explores the South Carolina (SC) **test** dataset to understand household counts, income distribution, and demographic characteristics."
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": null,
    "id": "cell-1",
    "metadata": {},
    "outputs": [],
@@ -21,114 +21,55 @@
     "import pandas as pd\n",
     "import numpy as np\n",
     "\n",
-    "SC_DATASET = \"hf://policyengine/policyengine-us-data/staging/states/SC.h5\""
+    "SC_DATASET = \"hf://policyengine/test/mar/SC.h5\""
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": null,
    "id": "cell-2",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`\n"
-     ]
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "2eb0b3ac0b824f52a3a6066931afc5ac",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "SC.h5:   0%|          | 0.00/38.1M [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    }
-   ],
+   "outputs": [],
    "source": [
-    "# Load SC staging dataset\n",
+    "# Load SC test dataset\n",
     "sim = Microsimulation(dataset=SC_DATASET)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": null,
    "id": "cell-3",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Number of households in dataset: 22,528\n",
-      "Household count (weighted): 1,587,912\n",
-      "Person count (weighted): 4,788,894\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
-    "# Check dataset size\n",
-    "household_weight = sim.calculate(\"household_weight\", period=2025)\n",
-    "household_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\")\n",
-    "person_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\")\n",
+    "# Check dataset size - use .values to get raw arrays (avoid MicroSeries auto-weighting)\n",
+    "household_weight = sim.calculate(\"household_weight\", period=2025).values\n",
+    "household_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\").values\n",
+    "person_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\").values\n",
+    "\n",
+    "# Weighted sums using raw arrays\n",
+    "weighted_household_count = (household_count * household_weight).sum()\n",
+    "weighted_person_count = (person_count * household_weight).sum()\n",
     "\n",
     "print(f\"Number of households in dataset: {len(household_weight):,}\")\n",
-    "print(f\"Household count (weighted): {household_count.sum():,.0f}\")\n",
-    "print(f\"Person count (weighted): {person_count.sum():,.0f}\")"
+    "print(f\"Household count (weighted): {weighted_household_count:,.0f}\")\n",
+    "print(f\"Person count (weighted): {weighted_person_count:,.0f}\")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": null,
    "id": "cell-4",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "============================================================\n",
-      "INCOME DISTRIBUTION SUMMARY\n",
-      "============================================================\n",
-      "\n",
-      "Household AGI:\n",
-      "  Unweighted median: $67,907\n",
-      "  Weighted median:   $60,378\n",
-      "  Weighted average:  $105,617\n",
-      "\n",
-      "Person AGI:\n",
-      "  Unweighted median: $67,460\n",
-      "  Weighted median:   $56,366\n",
-      "  Weighted average:  $100,583\n",
-      "\n",
-      "Average household size: 3.0\n",
-      "\n",
-      "Weighted household AGI percentiles:\n",
-      "  25th percentile: $27,117\n",
-      "  50th percentile: $60,378\n",
-      "  75th percentile: $105,515\n",
-      "  90th percentile: $153,279\n",
-      "  95th percentile: $237,856\n",
-      "  Max AGI: $353,653,602\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "# Check income distribution (weighted vs unweighted, household and person level)\n",
-    "agi_household = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\")\n",
-    "agi_hh_array = np.array(agi_household)\n",
-    "hh_weights = np.array(sim.calculate(\"household_weight\", period=2025))\n",
+    "# Use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)\n",
+    "agi_hh_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\n",
+    "hh_weights = sim.calculate(\"household_weight\", period=2025).values\n",
     "\n",
-    "agi_person = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\")\n",
-    "agi_person_array = np.array(agi_person)\n",
-    "person_weights = np.array(sim.calculate(\"person_weight\", period=2025))\n",
+    "agi_person_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\").values\n",
+    "person_weights = sim.calculate(\"person_weight\", period=2025).values\n",
     "\n",
     "# Weighted percentile calculation\n",
     "def weighted_percentile(values, weights, percentile):\n",
@@ -182,34 +123,21 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": null,
    "id": "cell-5",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Households with children (weighted):\n",
-      "  Total households with children: 637,558\n",
-      "  Households with 1 child: 308,153\n",
-      "  Households with 2 children: 190,106\n",
-      "  Households with 3+ children: 139,299\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
-    "# Check households with children\n",
-    "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\")\n",
-    "household_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\")\n",
-    "household_weight = sim.calculate(\"household_weight\", period=2025, map_to=\"person\")\n",
+    "# Check households with children - use .values for raw arrays\n",
+    "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\").values\n",
+    "household_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\").values\n",
+    "household_weight_person = sim.calculate(\"household_weight\", period=2025, map_to=\"person\").values\n",
     "\n",
     "# Create DataFrame\n",
     "df_households = pd.DataFrame({\n",
     "    'household_id': household_id,\n",
     "    'is_child': is_child,\n",
-    "    'household_weight': household_weight\n",
+    "    'household_weight': household_weight_person\n",
     "})\n",
     "\n",
     "# Count children per household\n",
@@ -233,30 +161,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": null,
    "id": "cell-6",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Children by age:\n",
-      "  Total children under 18: 1,157,115\n",
-      "  Children under 6: 350,517\n",
-      "  Children under 3: 177,575\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
-    "# Check children by age groups\n",
+    "# Check children by age groups - use .values for raw arrays\n",
     "df = pd.DataFrame({\n",
-    "    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\"),\n",
-    "    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\"),\n",
-    "    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\"),\n",
-    "    \"age\": sim.calculate(\"age\", map_to=\"person\"),\n",
-    "    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\")\n",
+    "    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\").values,\n",
+    "    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\").values,\n",
+    "    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\").values,\n",
+    "    \"age\": sim.calculate(\"age\", map_to=\"person\").values,\n",
+    "    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\").values\n",
     "})\n",
     "\n",
     "# Filter for children and apply weights\n",
@@ -277,46 +193,10 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": null,
    "id": "cell-7",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "=================================================================\n",
-      "SC STAGING DATASET SUMMARY - WEIGHTED (Population Estimates)\n",
-      "=================================================================\n",
-      "                         Metric        Value\n",
-      "     Household count (weighted)    1,587,912\n",
-      "        Person count (weighted)    4,788,894\n",
-      "         Average household size          3.0\n",
-      "  Weighted median household AGI      $60,378\n",
-      " Weighted average household AGI     $105,617\n",
-      "     Weighted median person AGI      $56,366\n",
-      "    Weighted average person AGI     $100,583\n",
-      "Unweighted median household AGI      $67,907\n",
-      "   Unweighted median person AGI      $67,460\n",
-      "  25th percentile household AGI      $27,117\n",
-      "  75th percentile household AGI     $105,515\n",
-      "  90th percentile household AGI     $153,279\n",
-      "  95th percentile household AGI     $237,856\n",
-      "              Max household AGI $353,653,602\n",
-      " Total households with children      637,558\n",
-      "        Households with 1 child      308,153\n",
-      "     Households with 2 children      190,106\n",
-      "    Households with 3+ children      139,299\n",
-      "        Total children under 18    1,157,115\n",
-      "               Children under 6      350,517\n",
-      "               Children under 3      177,575\n",
-      "=================================================================\n",
-      "\n",
-      "Summary saved to: sc_staging_dataset_summary_weighted.csv\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "# Create comprehensive summary table\n",
     "summary_data = {\n",
@@ -344,8 +224,8 @@
     "        'Children under 3'\n",
     "    ],\n",
     "    'Value': [\n",
-    "        f\"{household_count.sum():,.0f}\",\n",
-    "        f\"{person_count.sum():,.0f}\",\n",
+    "        f\"{weighted_household_count:,.0f}\",\n",
+    "        f\"{weighted_person_count:,.0f}\",\n",
     "        f\"{avg_hh_size:.1f}\",\n",
     "        f\"${weighted_median_hh:,.0f}\",\n",
     "        f\"${weighted_avg_hh:,.0f}\",\n",
@@ -371,40 +251,26 @@
     "summary_df = pd.DataFrame(summary_data)\n",
     "\n",
     "print(\"\\n\" + \"=\"*65)\n",
-    "print(\"SC STAGING DATASET SUMMARY - WEIGHTED (Population Estimates)\")\n",
+    "print(\"SC TEST DATASET SUMMARY - WEIGHTED (Population Estimates)\")\n",
     "print(\"=\"*65)\n",
     "print(summary_df.to_string(index=False))\n",
     "print(\"=\"*65)\n",
     "\n",
     "# Save table\n",
-    "summary_df.to_csv('sc_staging_dataset_summary_weighted.csv', index=False)\n",
-    "print(\"\\nSummary saved to: sc_staging_dataset_summary_weighted.csv\")"
+    "summary_df.to_csv('sc_test_dataset_summary_weighted.csv', index=False)\n",
+    "print(\"\\nSummary saved to: sc_test_dataset_summary_weighted.csv\")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": null,
    "id": "cell-8",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "======================================================================\n",
-      "HOUSEHOLDS WITH $0 INCOME\n",
-      "======================================================================\n",
-      "Household count: 9,513\n",
-      "Percentage of all households: 0.60%\n",
-      "======================================================================\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
-    "# Households with $0 income\n",
-    "agi_hh = np.array(sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\"))\n",
-    "weights = np.array(sim.calculate(\"household_weight\", period=2025))\n",
+    "# Households with $0 income - using raw arrays\n",
+    "agi_hh = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\n",
+    "weights = sim.calculate(\"household_weight\", period=2025).values\n",
     "\n",
     "zero_income_mask = agi_hh == 0\n",
     "zero_income_count = weights[zero_income_mask].sum()\n",
@@ -420,32 +286,10 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": null,
    "id": "cell-9",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "======================================================================\n",
-      "HOUSEHOLD COUNTS BY INCOME BRACKET\n",
-      "======================================================================\n",
-      "Income Bracket Households % of All Households\n",
-      "       $0-$10k    136,673               8.61%\n",
-      "     $10k-$20k    154,618               9.74%\n",
-      "     $20k-$30k    148,652               9.36%\n",
-      "     $30k-$40k    125,157               7.88%\n",
-      "     $40k-$50k    121,742               7.67%\n",
-      "     $50k-$60k    101,082               6.37%\n",
-      "======================================================================\n",
-      "\n",
-      "Total households in $0-$60k range: 787,925\n",
-      "Percentage of all households in $0-$60k range: 49.62%\n"
-     ]
-    }
-   ],
+   "outputs": [],
    "source": [
     "# Household counts by income brackets\n",
     "income_brackets = [\n",
@@ -491,16 +335,8 @@
    "name": "python3"
   },
   "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
    "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.5"
+   "version": "3.11.0"
   }
  },
  "nbformat": 4,
diff --git a/us/states/sc/sc_h4216_budget_impact.py b/us/states/sc/sc_h4216_budget_impact.py
index be53250..bf80b03 100644
--- a/us/states/sc/sc_h4216_budget_impact.py
+++ b/us/states/sc/sc_h4216_budget_impact.py
@@ -8,7 +8,7 @@
 from policyengine_core.reforms import Reform
 import numpy as np
 
-SC_DATASET = "hf://policyengine/policyengine-us-data/staging/states/SC.h5"
+SC_DATASET = "hf://policyengine/test/mar/SC.h5"
 TAX_YEAR = 2026
 
 def create_h4216_reform():
@@ -58,9 +58,9 @@ def create_h4216_reform():
 print(f"\nBaseline SC Income Tax Revenue: ${baseline_revenue:,.0f}")
 print(f"Reform SC Income Tax Revenue:   ${reform_revenue:,.0f}")
 print(f"\n>>> BUDGET IMPACT: ${budget_impact:,.0f} <<<")
-print(f"\nRFA Estimate: -$119,100,000")
-print(f"Difference from RFA: ${budget_impact - (-119100000):,.0f}")
-print(f"Accuracy: {(1 - abs(budget_impact - (-119100000)) / 119100000) * 100:.1f}%")
+print(f"\nRFA Estimate (5.21%): -$309,000,000")
+print(f"Difference from RFA: ${budget_impact - (-309000000):,.0f}")
+print(f"Accuracy: {(1 - abs(budget_impact - (-309000000)) / 309000000) * 100:.1f}%")
 print("\n" + "-"*60)
 print(f"Tax units with DECREASE: {pct_decrease:.1f}%")
 print(f"Tax units with INCREASE: {pct_increase:.1f}%")
diff --git a/us/states/sc/sc_h4216_dataset_comparison.py b/us/states/sc/sc_h4216_dataset_comparison.py
new file mode 100644
index 0000000..da89d35
--- /dev/null
+++ b/us/states/sc/sc_h4216_dataset_comparison.py
@@ -0,0 +1,92 @@
+"""
+SC H.4216 Budget Impact Comparison Across Datasets
+Compares budgetary impacts using production, staging, and test datasets.
+"""
+
+from policyengine_us import Microsimulation
+from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216
+from policyengine_core.reforms import Reform
+import numpy as np
+
+TAX_YEAR = 2026
+
+DATASETS = {
+    "Production": "hf://policyengine/policyengine-us-data/states/SC.h5",
+    "Test (Mar)": "hf://policyengine/test/mar/SC.h5"
+}
+
+def create_h4216_reform(top_rate=0.0521):
+    param_reform = Reform.from_dict(
+        {
+            "gov.contrib.states.sc.h4216.in_effect": {
+                "2026-01-01.2100-12-31": True
+            },
+            "gov.contrib.states.sc.h4216.rates[1].rate": {
+                "2026-01-01.2100-12-31": top_rate
+            }
+        },
+        country_id="us",
+    )
+    base_reform = create_sc_h4216()
+    return (base_reform, param_reform)
+
+def calculate_impact(dataset_path, top_rate):
+    """Calculate budget impact for a given dataset and top rate."""
+    baseline = Microsimulation(dataset=dataset_path)
+    reform = create_h4216_reform(top_rate=top_rate)
+    reform_sim = Microsimulation(dataset=dataset_path, reform=reform)
+
+    baseline_tax = baseline.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
+    reform_tax = reform_sim.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
+    weight = baseline.calculate("tax_unit_weight", period=TAX_YEAR).values
+
+    tax_change = reform_tax - baseline_tax
+    budget_impact = (tax_change * weight).sum()
+    total_units = weight.sum()
+    baseline_revenue = (baseline_tax * weight).sum()
+
+    return {
+        "budget_impact": budget_impact,
+        "total_units": total_units,
+        "baseline_revenue": baseline_revenue
+    }
+
+# Run analysis
+results = {}
+for name, path in DATASETS.items():
+    print(f"\nProcessing {name}...")
+    results[name] = {
+        "5.21%": calculate_impact(path, 0.0521),
+        "5.39%": calculate_impact(path, 0.0539)
+    }
+    print(f"  Done!")
+
+# Print results
+print("\n" + "="*90)
+print("SC H.4216 BUDGET IMPACT COMPARISON ACROSS DATASETS")
+print("="*90)
+
+print(f"\n{'Dataset':<15} {'Tax Units':>15} {'Baseline Rev':>18} {'5.21% Impact':>18} {'5.39% Impact':>18}")
+print("-"*90)
+
+for name in DATASETS.keys():
+    r = results[name]
+    print(f"{name:<15} {r['5.21%']['total_units']:>15,.0f} ${r['5.21%']['baseline_revenue']:>16,.0f} ${r['5.21%']['budget_impact']:>16,.0f} ${r['5.39%']['budget_impact']:>16,.0f}")
+
+print("-"*90)
+print(f"{'RFA Estimate':<15} {'2,757,573':>15} {'N/A':>18} ${-309000000:>16,.0f} ${-119100000:>16,.0f}")
+print("="*90)
+
+# Accuracy comparison
+print("\n" + "="*90)
+print("ACCURACY vs RFA")
+print("="*90)
+print(f"{'Dataset':<15} {'5.21% PE':>15} {'vs RFA -$309M':>18} {'5.39% PE':>15} {'vs RFA -$119M':>18}")
+print("-"*90)
+for name in DATASETS.keys():
+    impact_521 = results[name]["5.21%"]["budget_impact"]
+    impact_539 = results[name]["5.39%"]["budget_impact"]
+    acc_521 = (1 - abs(impact_521 - (-309000000)) / 309000000) * 100
+    acc_539 = (1 - abs(impact_539 - (-119100000)) / 119100000) * 100
+    print(f"{name:<15} ${impact_521:>14,.0f} {acc_521:>16.1f}% ${impact_539:>14,.0f} {acc_539:>16.1f}%")
+print("="*90)
diff --git a/us/states/sc/sc_h4216_reform_analysis.ipynb b/us/states/sc/sc_h4216_reform_analysis.ipynb
index 9e7cbf2..5d8bf26 100644
--- a/us/states/sc/sc_h4216_reform_analysis.ipynb
+++ b/us/states/sc/sc_h4216_reform_analysis.ipynb
@@ -39,19 +39,10 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
-   "source": [
-    "from policyengine_us import Microsimulation\n",
-    "from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\n",
-    "from policyengine_core.reforms import Reform\n",
-    "import pandas as pd\n",
-    "import numpy as np\n",
-    "\n",
-    "SC_DATASET = \"hf://policyengine/policyengine-us-data/staging/states/SC.h5\"\n",
-    "TAX_YEAR = 2026  # Renamed to avoid conflict with YEAR constant from model_api"
-   ]
+   "source": "from policyengine_us import Microsimulation\nfrom policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\nfrom policyengine_core.reforms import Reform\nimport pandas as pd\nimport numpy as np\n\nSC_DATASET = \"hf://policyengine/test/mar/SC.h5\"\nTAX_YEAR = 2026  # Renamed to avoid conflict with YEAR constant from model_api"
   },
   {
    "cell_type": "code",
@@ -106,7 +97,34 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Loading baseline (current SC tax law)...\n",
+      "Loading baseline (current SC tax law)...\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "eddcbb760af5468b94382e107443581b",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "SC.h5:   0%|          | 0.00/52.8M [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
       "Baseline loaded\n",
       "\n",
       "Loading reform (H.4216 with 5.39% top rate)...\n",
@@ -149,8 +167,8 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Total tax units: 33,248\n",
-      "Weighted tax units (returns): 1,905,181\n"
+      "Total tax units: 48,461\n",
+      "Weighted tax units (returns): 3,204,719\n"
      ]
     }
    ],
@@ -373,11 +391,11 @@
       "====================================================================================================\n",
       "\n",
       "Impact: With this tax structure:\n",
-      "  - 29.7% of taxpayers have a LOWER tax liability\n",
-      "  - 26.8% of taxpayers have a HIGHER tax liability\n",
-      "  - 43.5% are UNCHANGED\n",
+      "  - 33.1% of taxpayers have a LOWER tax liability\n",
+      "  - 25.1% of taxpayers have a HIGHER tax liability\n",
+      "  - 41.8% are UNCHANGED\n",
       "\n",
-      "General Fund Impact: $-110,942,720\n",
+      "General Fund Impact: $-14,654,645,248\n",
       "====================================================================================================\n"
      ]
     }
@@ -415,21 +433,21 @@
      "output_type": "stream",
      "text": [
       "     Federal AGI Range  Est. # Returns  % of Returns  Old Avg Tax  New Avg Tax  Total Change ($)  Decrease #  Decrease %  Increase #  Increase %  No Change %  Zero Tax %\n",
-      "                   $0*           58352           3.1            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
-      "         $1 to $10,000          168000           8.8            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
-      "    $10,001 to $20,000          205689          10.8            0            3            697809           0    0.000000       12906    6.300000    93.699997   93.699997\n",
-      "    $20,001 to $30,000          226431          11.9           33           45           2860578        1427    0.600000       51406   22.700001    76.699997   75.699997\n",
-      "    $30,001 to $40,000          174753           9.2          182          156          -4382816       57708   33.000000       22397   12.800000    54.200001   53.900002\n",
-      "    $40,001 to $50,000          155837           8.2          319          244         -11700509       48322   31.000000       44468   28.500000    40.500000   40.500000\n",
-      "    $50,001 to $75,000          262861          13.8          581          475         -27688580      136898   52.099998       77200   29.400000    18.600000   18.600000\n",
-      "   $75,001 to $100,000          215040          11.3         1338         1161         -38227128      138525   64.400002       50694   23.600000    12.000000   12.300000\n",
-      "  $100,001 to $150,000          278127          14.6         2928         3130          56022196      118122   42.500000      156517   56.299999     1.300000    1.000000\n",
-      "  $150,001 to $200,000           49870           2.6         5124         5814          34402136        1551    3.100000       48319   96.900002     0.000000    0.000000\n",
-      "  $200,001 to $300,000           40779           2.1         9149         9707          22764908        2048    5.000000       38672   94.800003     0.100000    0.000000\n",
-      "  $300,001 to $500,000           42814           2.2        17785        17299         -20835856       35387   82.699997        6631   15.500000     1.900000    1.900000\n",
-      "$500,001 to $1,000,000           13719           0.7        27237        26665          -7850124       13076   95.300003         643    4.700000     0.000000    0.000000\n",
-      "       Over $1,000,000           12909           0.7       113354       104291        -117005352       12703   98.400002         206    1.600000     0.000000    0.000000\n",
-      "                 Total         1905181         100.0         2399         2341        -110942720      565768   29.700001      510059   26.799999    43.500000   43.400002\n"
+      "                   $0*          369521          11.5            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
+      "         $1 to $10,000          406965          12.7            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
+      "    $10,001 to $20,000          295746           9.2            0           11           3145121           0    0.000000       64066   21.700001    78.300003   78.199997\n",
+      "    $20,001 to $30,000          278678           8.7           67           96           8096652        9396    3.400000      127046   45.599998    51.000000   50.799999\n",
+      "    $30,001 to $40,000          252815           7.9          289          243         -11809976      135818   53.700001       39744   15.700000    30.600000   30.200001\n",
+      "    $40,001 to $50,000          204601           6.4          632          459         -35389328      118222   57.799999       47018   23.000000    19.200001   19.200001\n",
+      "    $50,001 to $75,000          407221          12.7         1214         1073         -57309672      273530   67.199997       78571   19.299999    13.500000   13.500000\n",
+      "   $75,001 to $100,000          253742           7.9         2078         2056          -5720177      149558   58.900002       90703   35.700001     5.300000    4.900000\n",
+      "  $100,001 to $150,000          310561           9.7         3694         3875          56132876      147042   47.299999      160837   51.799999     0.900000    0.500000\n",
+      "  $150,001 to $200,000          145460           4.5         6365         6796          62730072       31526   21.700001      113934   78.300003     0.000000    0.000000\n",
+      "  $200,001 to $300,000          100241           3.1         9594        10054          46091116       38119   38.000000       60974   60.799999     1.100000    1.100000\n",
+      "  $300,001 to $500,000          103531           3.2        16932        16233         -72464000       91344   88.199997       11782   11.400000     0.400000    0.400000\n",
+      "$500,001 to $1,000,000           19045           0.6        27051        25511         -29327746       16469   86.500000        2249   11.800000     1.700000    1.700000\n",
+      "       Over $1,000,000           56592           1.8      4277978      4019660      -14618820608       49508   87.500000        7084   12.500000     0.000000    0.000000\n",
+      "                 Total         3204719         100.0        77588        73015      -14654645248     1060532   33.099998      804008   25.100000    41.799999   41.700001\n"
      ]
     }
    ],
@@ -497,21 +515,21 @@
       "ESTIMATED TAX RETURN DISTRIBUTION\n",
       "================================================================================\n",
       "     Federal AGI Range  Est. # Returns  % of Returns  Old Avg Tax  New Avg Tax\n",
-      "                   $0*           58352           3.1            0            0\n",
-      "         $1 to $10,000          168000           8.8            0            0\n",
-      "    $10,001 to $20,000          205689          10.8            0            3\n",
-      "    $20,001 to $30,000          226431          11.9           33           45\n",
-      "    $30,001 to $40,000          174753           9.2          182          156\n",
-      "    $40,001 to $50,000          155837           8.2          319          244\n",
-      "    $50,001 to $75,000          262861          13.8          581          475\n",
-      "   $75,001 to $100,000          215040          11.3         1338         1161\n",
-      "  $100,001 to $150,000          278127          14.6         2928         3130\n",
-      "  $150,001 to $200,000           49870           2.6         5124         5814\n",
-      "  $200,001 to $300,000           40779           2.1         9149         9707\n",
-      "  $300,001 to $500,000           42814           2.2        17785        17299\n",
-      "$500,001 to $1,000,000           13719           0.7        27237        26665\n",
-      "       Over $1,000,000           12909           0.7       113354       104291\n",
-      "                 Total         1905181         100.0         2399         2341\n"
+      "                   $0*          369521          11.5            0            0\n",
+      "         $1 to $10,000          406965          12.7            0            0\n",
+      "    $10,001 to $20,000          295746           9.2            0           11\n",
+      "    $20,001 to $30,000          278678           8.7           67           96\n",
+      "    $30,001 to $40,000          252815           7.9          289          243\n",
+      "    $40,001 to $50,000          204601           6.4          632          459\n",
+      "    $50,001 to $75,000          407221          12.7         1214         1073\n",
+      "   $75,001 to $100,000          253742           7.9         2078         2056\n",
+      "  $100,001 to $150,000          310561           9.7         3694         3875\n",
+      "  $150,001 to $200,000          145460           4.5         6365         6796\n",
+      "  $200,001 to $300,000          100241           3.1         9594        10054\n",
+      "  $300,001 to $500,000          103531           3.2        16932        16233\n",
+      "$500,001 to $1,000,000           19045           0.6        27051        25511\n",
+      "       Over $1,000,000           56592           1.8      4277978      4019660\n",
+      "                 Total         3204719         100.0        77588        73015\n"
      ]
     }
    ],
@@ -541,18 +559,18 @@
       "                   $0*           0    0.000000                   0             0\n",
       "         $1 to $10,000           0    0.000000                   0             0\n",
       "    $10,001 to $20,000           0    0.000000                   0             0\n",
-      "    $20,001 to $30,000        1427    0.600000               -8402            -6\n",
-      "    $30,001 to $40,000       57708   33.000000            -5940918          -103\n",
-      "    $40,001 to $50,000       48322   31.000000           -15560643          -322\n",
-      "    $50,001 to $75,000      136898   52.099998           -37521040          -274\n",
-      "   $75,001 to $100,000      138525   64.400002           -52849696          -382\n",
-      "  $100,001 to $150,000      118122   42.500000           -19568998          -166\n",
-      "  $150,001 to $200,000        1551    3.100000             -380708          -246\n",
-      "  $200,001 to $300,000        2048    5.000000             -201820           -99\n",
-      "  $300,001 to $500,000       35387   82.699997           -24901672          -704\n",
-      "$500,001 to $1,000,000       13076   95.300003           -19588270         -1498\n",
-      "       Over $1,000,000       12703   98.400002          -128537088        -10118\n",
-      "                 Total      565768   29.700001          -305059264          -539\n"
+      "    $20,001 to $30,000        9396    3.400000              -50358            -5\n",
+      "    $30,001 to $40,000      135818   53.700001           -14845139          -109\n",
+      "    $40,001 to $50,000      118222   57.799999           -39889976          -337\n",
+      "    $50,001 to $75,000      273530   67.199997           -73336032          -268\n",
+      "   $75,001 to $100,000      149558   58.900002           -36993168          -247\n",
+      "  $100,001 to $150,000      147042   47.299999           -22048396          -150\n",
+      "  $150,001 to $200,000       31526   21.700001           -11001782          -349\n",
+      "  $200,001 to $300,000       38119   38.000000           -21143300          -555\n",
+      "  $300,001 to $500,000       91344   88.199997           -93526784         -1024\n",
+      "$500,001 to $1,000,000       16469   86.500000           -35028512         -2127\n",
+      "       Over $1,000,000       49508   87.500000        -17806082048       -359664\n",
+      "                 Total     1060532   33.099998        -18153947136        -17118\n"
      ]
     }
    ],
@@ -581,19 +599,19 @@
       "     Federal AGI Range  Increase #  Increase %  Total Increase ($)  Avg Increase\n",
       "                   $0*           0    0.000000                   0             0\n",
       "         $1 to $10,000           0    0.000000                   0             0\n",
-      "    $10,001 to $20,000       12906    6.300000              697809            54\n",
-      "    $20,001 to $30,000       51406   22.700001             2871184            56\n",
-      "    $30,001 to $40,000       22397   12.800000             1558448            70\n",
-      "    $40,001 to $50,000       44468   28.500000             3860133            87\n",
-      "    $50,001 to $75,000       77200   29.400000             9832463           127\n",
-      "   $75,001 to $100,000       50694   23.600000            14622566           288\n",
-      "  $100,001 to $150,000      156517   56.299999            75591424           483\n",
-      "  $150,001 to $200,000       48319   96.900002            34782844           720\n",
-      "  $200,001 to $300,000       38672   94.800003            22966736           594\n",
-      "  $300,001 to $500,000        6631   15.500000             4065817           613\n",
-      "$500,001 to $1,000,000         643    4.700000            11738147         18254\n",
-      "       Over $1,000,000         206    1.600000            11531744         56085\n",
-      "                 Total      510059   26.799999           194119312           381\n"
+      "    $10,001 to $20,000       64066   21.700001             3144930            49\n",
+      "    $20,001 to $30,000      127046   45.599998             8146672            64\n",
+      "    $30,001 to $40,000       39744   15.700000             3035304            76\n",
+      "    $40,001 to $50,000       47018   23.000000             4500647            96\n",
+      "    $50,001 to $75,000       78571   19.299999            16026354           204\n",
+      "   $75,001 to $100,000       90703   35.700001            31273924           345\n",
+      "  $100,001 to $150,000      160837   51.799999            78180864           486\n",
+      "  $150,001 to $200,000      113934   78.300003            73731856           647\n",
+      "  $200,001 to $300,000       60974   60.799999            67234448          1103\n",
+      "  $300,001 to $500,000       11782   11.400000            21062782          1788\n",
+      "$500,001 to $1,000,000        2249   11.800000             5700766          2534\n",
+      "       Over $1,000,000        7084   12.500000          3187261952        449920\n",
+      "                 Total      804008   25.100000          3499300352          4352\n"
      ]
     }
    ],
@@ -620,21 +638,21 @@
       "TAX RETURNS WITH NO CHANGE / ZERO TAX LIABILITY\n",
       "================================================================================\n",
       "     Federal AGI Range  No Change #  No Change %  Zero Tax #  Zero Tax %\n",
-      "                   $0*        58352   100.000000       58352  100.000000\n",
-      "         $1 to $10,000       168000   100.000000      168000  100.000000\n",
-      "    $10,001 to $20,000       192783    93.699997      192783   93.699997\n",
-      "    $20,001 to $30,000       173597    76.699997      171348   75.699997\n",
-      "    $30,001 to $40,000        94648    54.200001       94228   53.900002\n",
-      "    $40,001 to $50,000        63047    40.500000       63047   40.500000\n",
-      "    $50,001 to $75,000        48763    18.600000       48850   18.600000\n",
-      "   $75,001 to $100,000        25821    12.000000       26375   12.300000\n",
-      "  $100,001 to $150,000         3487     1.300000        2748    1.000000\n",
+      "                   $0*       369521   100.000000      369521  100.000000\n",
+      "         $1 to $10,000       406965   100.000000      406965  100.000000\n",
+      "    $10,001 to $20,000       231681    78.300003      231347   78.199997\n",
+      "    $20,001 to $30,000       142236    51.000000      141555   50.799999\n",
+      "    $30,001 to $40,000        77253    30.600000       76459   30.200001\n",
+      "    $40,001 to $50,000        39362    19.200001       39362   19.200001\n",
+      "    $50,001 to $75,000        55120    13.500000       55120   13.500000\n",
+      "   $75,001 to $100,000        13480     5.300000       12472    4.900000\n",
+      "  $100,001 to $150,000         2682     0.900000        1604    0.500000\n",
       "  $150,001 to $200,000            0     0.000000           0    0.000000\n",
-      "  $200,001 to $300,000           59     0.100000           0    0.000000\n",
-      "  $300,001 to $500,000          796     1.900000         796    1.900000\n",
-      "$500,001 to $1,000,000            0     0.000000           0    0.000000\n",
-      "       Over $1,000,000            0     0.000000           0    0.000000\n",
-      "                 Total       829354    43.500000      826527   43.400002\n"
+      "  $200,001 to $300,000         1147     1.100000        1069    1.100000\n",
+      "  $300,001 to $500,000          405     0.400000         405    0.400000\n",
+      "$500,001 to $1,000,000          326     1.700000         326    1.700000\n",
+      "       Over $1,000,000            1     0.000000           1    0.000000\n",
+      "                 Total      1340179    41.799999     1336206   41.700001\n"
      ]
     }
    ],
@@ -676,15 +694,15 @@
       "\n",
       "General Fund Impact:\n",
       "  RFA Estimate:          $   -238,151,000\n",
-      "  PolicyEngine Estimate: $   -110,942,720\n",
-      "  Difference:            $    127,208,280\n",
+      "  PolicyEngine Estimate: $-14,654,645,248\n",
+      "  Difference:            $-14,416,494,248\n",
       "\n",
-      "  Accuracy vs RFA: 46.6%\n",
+      "  Accuracy vs RFA: -5953.5%\n",
       "\n",
       "Total Returns:\n",
       "  RFA:             5,515,148\n",
-      "  PolicyEngine:    1,905,181\n",
-      "  Difference:     -3,609,967\n"
+      "  PolicyEngine:    3,204,719\n",
+      "  Difference:     -2,310,428\n"
      ]
     }
    ],
@@ -736,21 +754,21 @@
       "================================================================================\n",
       "IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\n",
       "================================================================================\n",
-      "             AGI Range  PE Returns  RFA Returns  PE Impact  RFA Impact     Diff ($)\n",
-      "                   $0*       58352        78854          0   -571000.0     571000.0\n",
-      "         $1 to $10,000      168000            0          0         0.0          0.0\n",
-      "    $10,001 to $20,000      205689            0     697809         0.0     697809.0\n",
-      "    $20,001 to $30,000      226431            0    2860578         0.0    2860578.0\n",
-      "    $30,001 to $40,000      174753            0   -4382816         0.0   -4382816.0\n",
-      "    $40,001 to $50,000      155837            0  -11700509         0.0  -11700509.0\n",
-      "    $50,001 to $75,000      262861            0  -27688580         0.0  -27688580.0\n",
-      "   $75,001 to $100,000      215040            0  -38227128         0.0  -38227128.0\n",
-      "  $100,001 to $150,000      278127            0   56022196         0.0   56022196.0\n",
-      "  $150,001 to $200,000       49870            0   34402136         0.0   34402136.0\n",
-      "  $200,001 to $300,000       40779            0   22764908         0.0   22764908.0\n",
-      "  $300,001 to $500,000       42814            0  -20835856         0.0  -20835856.0\n",
-      "$500,001 to $1,000,000       13719            0   -7850124         0.0   -7850124.0\n",
-      "       Over $1,000,000       12909            0 -117005352         0.0 -117005352.0\n"
+      "             AGI Range  PE Returns  RFA Returns    PE Impact  RFA Impact      Diff ($)\n",
+      "                   $0*      369521        78854            0   -571000.0  5.710000e+05\n",
+      "         $1 to $10,000      406965            0            0         0.0  0.000000e+00\n",
+      "    $10,001 to $20,000      295746            0      3145121         0.0  3.145121e+06\n",
+      "    $20,001 to $30,000      278678            0      8096652         0.0  8.096652e+06\n",
+      "    $30,001 to $40,000      252815            0    -11809976         0.0 -1.180998e+07\n",
+      "    $40,001 to $50,000      204601            0    -35389328         0.0 -3.538933e+07\n",
+      "    $50,001 to $75,000      407221            0    -57309672         0.0 -5.730967e+07\n",
+      "   $75,001 to $100,000      253742            0     -5720177         0.0 -5.720177e+06\n",
+      "  $100,001 to $150,000      310561            0     56132876         0.0  5.613288e+07\n",
+      "  $150,001 to $200,000      145460            0     62730072         0.0  6.273007e+07\n",
+      "  $200,001 to $300,000      100241            0     46091116         0.0  4.609112e+07\n",
+      "  $300,001 to $500,000      103531            0    -72464000         0.0 -7.246400e+07\n",
+      "$500,001 to $1,000,000       19045            0    -29327746         0.0 -2.932775e+07\n",
+      "       Over $1,000,000       56592            0 -14618820608         0.0 -1.461882e+10\n"
      ]
     }
    ],
@@ -810,4 +828,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
+}
\ No newline at end of file
diff --git a/us/states/sc/sc_h4216_tax_impact_analysis.csv b/us/states/sc/sc_h4216_tax_impact_analysis.csv
index 79ed7e3..ba8d6d7 100644
--- a/us/states/sc/sc_h4216_tax_impact_analysis.csv
+++ b/us/states/sc/sc_h4216_tax_impact_analysis.csv
@@ -1,16 +1,16 @@
 Federal AGI Range,Est. # Returns,% of Returns,Old Avg Tax,New Avg Tax,Returns w/ Change,% w/ Change,Avg Change,Total Change ($),Decrease #,Decrease %,Total Decrease ($),Avg Decrease,Increase #,Increase %,Total Increase ($),Avg Increase,No Change #,No Change %,Zero Tax #,Zero Tax %
-$0*,58352,3.0999999046325684,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,58352,100.0,58352,100.0
-"$1 to $10,000",168000,8.800000190734863,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,168000,100.0,168000,100.0
-"$10,001 to $20,000",205689,10.800000190734863,0,3,12906,6.3,54,697809,0,0.0,0,0,12906,6.3,697809,54,192783,93.7,192783,93.7
-"$20,001 to $30,000",226431,11.899999618530273,33,45,52834,23.3,54,2860578,1427,0.6,-8402,-6,51406,22.7,2871184,56,173597,76.7,171348,75.7
-"$30,001 to $40,000",174753,9.199999809265137,182,156,80105,45.8,-55,-4382816,57708,33.0,-5940918,-103,22397,12.8,1558448,70,94648,54.2,94228,53.9
-"$40,001 to $50,000",155837,8.199999809265137,319,244,92790,59.5,-126,-11700509,48322,31.0,-15560643,-322,44468,28.5,3860133,87,63047,40.5,63047,40.5
-"$50,001 to $75,000",262861,13.800000190734863,581,475,214098,81.4,-129,-27688580,136898,52.1,-37521040,-274,77200,29.4,9832463,127,48763,18.6,48850,18.6
-"$75,001 to $100,000",215040,11.300000190734863,1338,1161,189218,88.0,-202,-38227128,138525,64.4,-52849696,-382,50694,23.6,14622566,288,25821,12.0,26375,12.3
-"$100,001 to $150,000",278127,14.600000381469727,2928,3130,274640,98.7,204,56022196,118122,42.5,-19568998,-166,156517,56.3,75591424,483,3487,1.3,2748,1.0
-"$150,001 to $200,000",49870,2.5999999046325684,5124,5814,49870,100.0,690,34402136,1551,3.1,-380708,-246,48319,96.9,34782844,720,0,0.0,0,0.0
-"$200,001 to $300,000",40779,2.0999999046325684,9149,9707,40720,99.9,559,22764908,2048,5.0,-201820,-99,38672,94.8,22966736,594,59,0.1,0,0.0
-"$300,001 to $500,000",42814,2.200000047683716,17785,17299,42018,98.1,-496,-20835856,35387,82.7,-24901672,-704,6631,15.5,4065817,613,796,1.9,796,1.9
-"$500,001 to $1,000,000",13719,0.699999988079071,27237,26665,13719,100.0,-572,-7850124,13076,95.3,-19588270,-1498,643,4.7,11738147,18254,0,0.0,0,0.0
-"Over $1,000,000",12909,0.699999988079071,113354,104291,12909,100.0,-9064,-117005352,12703,98.4,-128537088,-10118,206,1.6,11531744,56085,0,0.0,0,0.0
-Total,1905181,100.0,2399,2341,1075827,56.5,-58,-110942720,565768,29.7,-305059264,-539,510059,26.8,194119312,381,829354,43.5,826527,43.4
+$0*,369521,11.5,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,369521,100.0,369521,100.0
+"$1 to $10,000",406965,12.699999809265137,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,406965,100.0,406965,100.0
+"$10,001 to $20,000",295746,9.199999809265137,0,11,64066,21.7,49,3145121,0,0.0,0,0,64066,21.7,3144930,49,231681,78.3,231347,78.2
+"$20,001 to $30,000",278678,8.699999809265137,67,96,136442,49.0,59,8096652,9396,3.4,-50358,-5,127046,45.6,8146672,64,142236,51.0,141555,50.8
+"$30,001 to $40,000",252815,7.900000095367432,289,243,175562,69.4,-67,-11809976,135818,53.7,-14845139,-109,39744,15.7,3035304,76,77253,30.6,76459,30.2
+"$40,001 to $50,000",204601,6.400000095367432,632,459,165240,80.8,-214,-35389328,118222,57.8,-39889976,-337,47018,23.0,4500647,96,39362,19.2,39362,19.2
+"$50,001 to $75,000",407221,12.699999809265137,1214,1073,352101,86.5,-163,-57309672,273530,67.2,-73336032,-268,78571,19.3,16026354,204,55120,13.5,55120,13.5
+"$75,001 to $100,000",253742,7.900000095367432,2078,2056,240262,94.7,-24,-5720177,149558,58.9,-36993168,-247,90703,35.7,31273924,345,13480,5.3,12472,4.9
+"$100,001 to $150,000",310561,9.699999809265137,3694,3875,307879,99.1,182,56132876,147042,47.3,-22048396,-150,160837,51.8,78180864,486,2682,0.9,1604,0.5
+"$150,001 to $200,000",145460,4.5,6365,6796,145460,100.0,431,62730072,31526,21.7,-11001782,-349,113934,78.3,73731856,647,0,0.0,0,0.0
+"$200,001 to $300,000",100241,3.0999999046325684,9594,10054,99094,98.9,465,46091116,38119,38.0,-21143300,-555,60974,60.8,67234448,1103,1147,1.1,1069,1.1
+"$300,001 to $500,000",103531,3.200000047683716,16932,16233,103126,99.6,-703,-72464000,91344,88.2,-93526784,-1024,11782,11.4,21062782,1788,405,0.4,405,0.4
+"$500,001 to $1,000,000",19045,0.6000000238418579,27051,25511,18718,98.3,-1567,-29327746,16469,86.5,-35028512,-2127,2249,11.8,5700766,2534,326,1.7,326,1.7
+"Over $1,000,000",56592,1.7999999523162842,4277978,4019660,56592,100.0,-258322,-14618820608,49508,87.5,-17806082048,-359664,7084,12.5,3187261952,449920,1,0.0,1,0.0
+Total,3204719,100.0,77588,73015,1864540,58.2,-4573,-14654645248,1060532,33.1,-18153947136,-17118,804008,25.1,3499300352,4352,1340179,41.8,1336206,41.7
diff --git a/us/states/sc/sc_staging_dataset_summary_weighted.csv b/us/states/sc/sc_staging_dataset_summary_weighted.csv
deleted file mode 100644
index e7ac8fa..0000000
--- a/us/states/sc/sc_staging_dataset_summary_weighted.csv
+++ /dev/null
@@ -1,22 +0,0 @@
-Metric,Value
-Household count (weighted),"1,587,912"
-Person count (weighted),"4,788,894"
-Average household size,3.0
-Weighted median household AGI,"$60,378"
-Weighted average household AGI,"$105,617"
-Weighted median person AGI,"$56,366"
-Weighted average person AGI,"$100,583"
-Unweighted median household AGI,"$67,907"
-Unweighted median person AGI,"$67,460"
-25th percentile household AGI,"$27,117"
-75th percentile household AGI,"$105,515"
-90th percentile household AGI,"$153,279"
-95th percentile household AGI,"$237,856"
-Max household AGI,"$353,653,602"
-Total households with children,"637,558"
-Households with 1 child,"308,153"
-Households with 2 children,"190,106"
-Households with 3+ children,"139,299"
-Total children under 18,"1,157,115"
-Children under 6,"350,517"
-Children under 3,"177,575"

From 6af4913ccbf576c2b7136389eaaf71f205a2f86c Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Fri, 6 Mar 2026 12:35:49 -0500
Subject: [PATCH 10/12] Add sc_h4216_test_analysis.ipynb for RFA comparison

- Produces output in exact RFA format for direct comparison
- Uses test dataset (hf://policyengine/test/mar/SC.h5)
- Uses 5.39% top rate (RFA version)
- Exports to pe_h4216_test_analysis.csv
- Includes side-by-side comparison with RFA data

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/sc_h4216_test_analysis.ipynb | 403 ++++++++++++++++++++++
 1 file changed, 403 insertions(+)
 create mode 100644 us/states/sc/sc_h4216_test_analysis.ipynb

diff --git a/us/states/sc/sc_h4216_test_analysis.ipynb b/us/states/sc/sc_h4216_test_analysis.ipynb
new file mode 100644
index 0000000..95e1d55
--- /dev/null
+++ b/us/states/sc/sc_h4216_test_analysis.ipynb
@@ -0,0 +1,403 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "cell-0",
+   "metadata": {},
+   "source": [
+    "# SC H.4216 Tax Reform Analysis - Test Dataset\n",
+    "\n",
+    "This notebook produces analysis in the same format as the RFA fiscal note for direct comparison.\n",
+    "\n",
+    "**Dataset:** `hf://policyengine/test/mar/SC.h5`\n",
+    "\n",
+    "**Reform:** H.4216 with 5.39% top rate (RFA version)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\n",
+    "from policyengine_core.reforms import Reform\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/test/mar/SC.h5\"\n",
+    "TAX_YEAR = 2026"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-2",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def create_h4216_reform(top_rate=0.0539):\n",
+    "    \"\"\"\n",
+    "    SC H.4216 Reform:\n",
+    "    - 1.99% up to $30k\n",
+    "    - top_rate over $30k (default 5.39% for RFA comparison)\n",
+    "    \"\"\"\n",
+    "    param_reform = Reform.from_dict(\n",
+    "        {\n",
+    "            \"gov.contrib.states.sc.h4216.in_effect\": {\n",
+    "                \"2026-01-01.2100-12-31\": True\n",
+    "            },\n",
+    "            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n",
+    "                \"2026-01-01.2100-12-31\": top_rate\n",
+    "            }\n",
+    "        },\n",
+    "        country_id=\"us\",\n",
+    "    )\n",
+    "    base_reform = create_sc_h4216()\n",
+    "    return (base_reform, param_reform)\n",
+    "\n",
+    "print(\"Loading simulations...\")\n",
+    "baseline = Microsimulation(dataset=SC_DATASET)\n",
+    "reform_sim = Microsimulation(dataset=SC_DATASET, reform=create_h4216_reform(0.0539))\n",
+    "print(\"Done!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-3",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get data - use .values to avoid double-weighting\n",
+    "baseline_tax = baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "reform_tax = reform_sim.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "agi = baseline.calculate(\"adjusted_gross_income\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "weight = baseline.calculate(\"tax_unit_weight\", period=TAX_YEAR).values\n",
+    "\n",
+    "tax_change = reform_tax - baseline_tax\n",
+    "\n",
+    "print(f\"Total tax units: {len(baseline_tax):,}\")\n",
+    "print(f\"Weighted tax units: {weight.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Define income brackets matching RFA exactly\n",
+    "income_brackets = [\n",
+    "    (float('-inf'), 0, \"$0*\"),\n",
+    "    (0, 10000, \"$1 to $10000\"),\n",
+    "    (10000, 20000, \"$10001 to $20000\"),\n",
+    "    (20000, 30000, \"$20001 to $30000\"),\n",
+    "    (30000, 40000, \"$30001 to $40000\"),\n",
+    "    (40000, 50000, \"$40001 to $50000\"),\n",
+    "    (50000, 75000, \"$50001 to $75000\"),\n",
+    "    (75000, 100000, \"$75001 to $100000\"),\n",
+    "    (100000, 150000, \"$100001 to $150000\"),\n",
+    "    (150000, 200000, \"$150001 to $200000\"),\n",
+    "    (200000, 300000, \"$200001 to $300000\"),\n",
+    "    (300000, 500000, \"$300001 to $500000\"),\n",
+    "    (500000, 1000000, \"$500001 to $1000000\"),\n",
+    "    (1000000, float('inf'), \"Over $1000000\")\n",
+    "]\n",
+    "\n",
+    "total_weight = weight.sum()\n",
+    "results = []\n",
+    "\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    if lower == float('-inf'):\n",
+    "        mask = agi <= upper\n",
+    "    elif upper == float('inf'):\n",
+    "        mask = agi > lower\n",
+    "    else:\n",
+    "        mask = (agi > lower) & (agi <= upper)\n",
+    "    \n",
+    "    if mask.sum() == 0:\n",
+    "        continue\n",
+    "    \n",
+    "    # Basic stats\n",
+    "    est_returns = weight[mask].sum()\n",
+    "    pct_returns = est_returns / total_weight * 100\n",
+    "    \n",
+    "    old_avg_tax = np.average(baseline_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    new_avg_tax = np.average(reform_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Returns with tax change (threshold $1)\n",
+    "    change_mask = mask & (np.abs(tax_change) > 1)\n",
+    "    returns_with_change = weight[change_mask].sum()\n",
+    "    pct_with_change = returns_with_change / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    if returns_with_change > 0:\n",
+    "        old_avg_changed = np.average(baseline_tax[change_mask], weights=weight[change_mask])\n",
+    "        new_avg_changed = np.average(reform_tax[change_mask], weights=weight[change_mask])\n",
+    "        avg_change = np.average(tax_change[change_mask], weights=weight[change_mask])\n",
+    "    else:\n",
+    "        old_avg_changed = 0\n",
+    "        new_avg_changed = 0\n",
+    "        avg_change = 0\n",
+    "    \n",
+    "    total_change = (tax_change[mask] * weight[mask]).sum()\n",
+    "    \n",
+    "    # Tax decrease\n",
+    "    decrease_mask = mask & (tax_change < -1)\n",
+    "    decrease_returns = weight[decrease_mask].sum()\n",
+    "    decrease_pct = decrease_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_decrease = (tax_change[decrease_mask] * weight[decrease_mask]).sum() if decrease_returns > 0 else 0\n",
+    "    avg_decrease = np.average(tax_change[decrease_mask], weights=weight[decrease_mask]) if decrease_returns > 0 else 0\n",
+    "    \n",
+    "    # Tax increase\n",
+    "    increase_mask = mask & (tax_change > 1)\n",
+    "    increase_returns = weight[increase_mask].sum()\n",
+    "    increase_pct = increase_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_increase = (tax_change[increase_mask] * weight[increase_mask]).sum() if increase_returns > 0 else 0\n",
+    "    avg_increase = np.average(tax_change[increase_mask], weights=weight[increase_mask]) if increase_returns > 0 else 0\n",
+    "    \n",
+    "    # No change\n",
+    "    no_change_mask = mask & (np.abs(tax_change) <= 1)\n",
+    "    no_change_returns = weight[no_change_mask].sum()\n",
+    "    no_change_pct = no_change_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Zero tax\n",
+    "    zero_tax_mask = mask & (reform_tax <= 0)\n",
+    "    zero_tax_returns = weight[zero_tax_mask].sum()\n",
+    "    zero_tax_pct = zero_tax_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    results.append({\n",
+    "        \"Federal AGI Range\": label,\n",
+    "        \"Est # Returns\": int(round(est_returns)),\n",
+    "        \"Est % Returns\": f\"{pct_returns:.1f}%\",\n",
+    "        \"Old Avg Tax Liability\": f\"${int(round(old_avg_tax))}\",\n",
+    "        \"New Avg Tax Liability\": f\"${int(round(new_avg_tax))}\",\n",
+    "        \"Returns with Tax Change\": int(round(returns_with_change)),\n",
+    "        \"% Returns in Range with Change\": f\"{pct_with_change:.1f}%\",\n",
+    "        \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed))}\",\n",
+    "        \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed))}\",\n",
+    "        \"Avg Tax Change\": f\"${int(round(avg_change))}\",\n",
+    "        \"Total Dollar Change\": f\"${int(round(total_change))}\",\n",
+    "        \"Tax Decrease # Returns\": int(round(decrease_returns)),\n",
+    "        \"Tax Decrease % in Range\": f\"{decrease_pct:.1f}%\",\n",
+    "        \"Total Decrease Amount\": f\"${int(round(total_decrease))}\",\n",
+    "        \"Avg Decrease Amount\": f\"${int(round(avg_decrease))}\",\n",
+    "        \"Tax Increase # Returns\": int(round(increase_returns)),\n",
+    "        \"Tax Increase % in Range\": f\"{increase_pct:.1f}%\",\n",
+    "        \"Total Increase Amount\": f\"${int(round(total_increase))}\",\n",
+    "        \"Avg Increase Amount\": f\"${int(round(avg_increase))}\",\n",
+    "        \"No Tax Change # Returns\": int(round(no_change_returns)),\n",
+    "        \"No Change % Returns\": f\"{no_change_pct:.1f}%\",\n",
+    "        \"Zero Tax # Returns\": int(round(zero_tax_returns)),\n",
+    "        \"Zero Tax % Returns\": f\"{zero_tax_pct:.1f}%\"\n",
+    "    })\n",
+    "\n",
+    "print(\"Bracket analysis complete!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-5",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Calculate totals\n",
+    "change_mask_all = np.abs(tax_change) > 1\n",
+    "decrease_mask_all = tax_change < -1\n",
+    "increase_mask_all = tax_change > 1\n",
+    "no_change_mask_all = np.abs(tax_change) <= 1\n",
+    "zero_tax_mask_all = reform_tax <= 0\n",
+    "\n",
+    "total_old_avg = np.average(baseline_tax, weights=weight)\n",
+    "total_new_avg = np.average(reform_tax, weights=weight)\n",
+    "total_change_amount = (tax_change * weight).sum()\n",
+    "\n",
+    "returns_with_change_all = weight[change_mask_all].sum()\n",
+    "old_avg_changed_all = np.average(baseline_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "new_avg_changed_all = np.average(reform_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "avg_change_all = np.average(tax_change[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "\n",
+    "decrease_returns_all = weight[decrease_mask_all].sum()\n",
+    "total_decrease_all = (tax_change[decrease_mask_all] * weight[decrease_mask_all]).sum()\n",
+    "avg_decrease_all = np.average(tax_change[decrease_mask_all], weights=weight[decrease_mask_all]) if decrease_returns_all > 0 else 0\n",
+    "\n",
+    "increase_returns_all = weight[increase_mask_all].sum()\n",
+    "total_increase_all = (tax_change[increase_mask_all] * weight[increase_mask_all]).sum()\n",
+    "avg_increase_all = np.average(tax_change[increase_mask_all], weights=weight[increase_mask_all]) if increase_returns_all > 0 else 0\n",
+    "\n",
+    "no_change_returns_all = weight[no_change_mask_all].sum()\n",
+    "zero_tax_returns_all = weight[zero_tax_mask_all].sum()\n",
+    "\n",
+    "results.append({\n",
+    "    \"Federal AGI Range\": \"Total\",\n",
+    "    \"Est # Returns\": int(round(total_weight)),\n",
+    "    \"Est % Returns\": \"100.0%\",\n",
+    "    \"Old Avg Tax Liability\": f\"${int(round(total_old_avg))}\",\n",
+    "    \"New Avg Tax Liability\": f\"${int(round(total_new_avg))}\",\n",
+    "    \"Returns with Tax Change\": int(round(returns_with_change_all)),\n",
+    "    \"% Returns in Range with Change\": f\"{returns_with_change_all / total_weight * 100:.1f}%\",\n",
+    "    \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed_all))}\",\n",
+    "    \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed_all))}\",\n",
+    "    \"Avg Tax Change\": f\"${int(round(avg_change_all))}\",\n",
+    "    \"Total Dollar Change\": f\"${int(round(total_change_amount))}\",\n",
+    "    \"Tax Decrease # Returns\": int(round(decrease_returns_all)),\n",
+    "    \"Tax Decrease % in Range\": f\"{decrease_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Decrease Amount\": f\"${int(round(total_decrease_all))}\",\n",
+    "    \"Avg Decrease Amount\": f\"${int(round(avg_decrease_all))}\",\n",
+    "    \"Tax Increase # Returns\": int(round(increase_returns_all)),\n",
+    "    \"Tax Increase % in Range\": f\"{increase_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Increase Amount\": f\"${int(round(total_increase_all))}\",\n",
+    "    \"Avg Increase Amount\": f\"${int(round(avg_increase_all))}\",\n",
+    "    \"No Tax Change # Returns\": int(round(no_change_returns_all)),\n",
+    "    \"No Change % Returns\": f\"{no_change_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Zero Tax # Returns\": int(round(zero_tax_returns_all)),\n",
+    "    \"Zero Tax % Returns\": f\"{zero_tax_returns_all / total_weight * 100:.1f}%\"\n",
+    "})\n",
+    "\n",
+    "df_results = pd.DataFrame(results)\n",
+    "print(\"Totals calculated!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-6",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Display summary\n",
+    "print(\"=\"*100)\n",
+    "print(\"H.4216 - POLICYENGINE ANALYSIS (Test Dataset, 5.39% Top Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(f\"\\nTotal Returns: {int(total_weight):,}\")\n",
+    "print(f\"General Fund Impact: ${total_change_amount:,.0f}\")\n",
+    "print(f\"\\nRFA Estimate: -$119,100,000\")\n",
+    "print(f\"Difference: ${total_change_amount - (-119100000):,.0f}\")\n",
+    "print(f\"Accuracy: {(1 - abs(total_change_amount - (-119100000)) / 119100000) * 100:.1f}%\")\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-7",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Export to CSV in RFA format\n",
+    "df_results.to_csv('pe_h4216_test_analysis.csv', index=False)\n",
+    "print(\"Exported to: pe_h4216_test_analysis.csv\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-8",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Display key columns for quick comparison\n",
+    "display_cols = [\n",
+    "    \"Federal AGI Range\", \"Est # Returns\", \"Est % Returns\",\n",
+    "    \"Old Avg Tax Liability\", \"New Avg Tax Liability\", \"Total Dollar Change\"\n",
+    "]\n",
+    "print(\"\\nKEY METRICS:\")\n",
+    "print(df_results[display_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "cell-9",
+   "metadata": {},
+   "source": [
+    "## Side-by-Side Comparison with RFA"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-10",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Load RFA data\n",
+    "rfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n",
+    "\n",
+    "def parse_dollar(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('$', '').replace(',', '').replace('%', ''))\n",
+    "    return val\n",
+    "\n",
+    "def parse_pct(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('%', ''))\n",
+    "    return val\n",
+    "\n",
+    "# Create comparison\n",
+    "comparison = []\n",
+    "for idx, pe_row in df_results.iterrows():\n",
+    "    agi_range = pe_row['Federal AGI Range']\n",
+    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == agi_range]\n",
+    "    \n",
+    "    pe_returns = pe_row['Est # Returns']\n",
+    "    pe_impact = parse_dollar(pe_row['Total Dollar Change'])\n",
+    "    \n",
+    "    if len(rfa_match) > 0:\n",
+    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
+    "        rfa_impact = parse_dollar(rfa_match['Total Dollar Change'].values[0])\n",
+    "    else:\n",
+    "        rfa_returns = 0\n",
+    "        rfa_impact = 0\n",
+    "    \n",
+    "    comparison.append({\n",
+    "        'AGI Range': agi_range,\n",
+    "        'PE Returns': f\"{pe_returns:,}\",\n",
+    "        'RFA Returns': f\"{rfa_returns:,}\" if rfa_returns else \"N/A\",\n",
+    "        'PE Impact': f\"${pe_impact:,.0f}\",\n",
+    "        'RFA Impact': f\"${rfa_impact:,.0f}\" if rfa_impact else \"N/A\",\n",
+    "        'Diff': f\"${pe_impact - rfa_impact:+,.0f}\" if rfa_impact else \"N/A\"\n",
+    "    })\n",
+    "\n",
+    "comparison_df = pd.DataFrame(comparison)\n",
+    "print(\"\\n\" + \"=\"*100)\n",
+    "print(\"POLICYENGINE vs RFA COMPARISON\")\n",
+    "print(\"=\"*100)\n",
+    "print(comparison_df.to_string(index=False))\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "cell-11",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Full results table\n",
+    "print(\"\\n\" + \"=\"*120)\n",
+    "print(\"FULL POLICYENGINE ANALYSIS (RFA Format)\")\n",
+    "print(\"=\"*120)\n",
+    "pd.set_option('display.max_columns', None)\n",
+    "pd.set_option('display.width', None)\n",
+    "print(df_results.to_string(index=False))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "name": "python",
+   "version": "3.11.0"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

From bc43548ce0381858752ee845166a03d506ed57b7 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Fri, 6 Mar 2026 12:45:15 -0500
Subject: [PATCH 11/12] Update SC H.4216 analysis with dataset comparison
 findings

- Add detailed analysis explaining why Production overestimates and Test underestimates
- Core issue: baseline revenue calibration ($6.5B Production vs $4.0B Test vs $6.4B RFA)
- Add test dataset exploration notebook and summary CSV
- Update comparison markdown with recommendations

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 us/states/sc/data_exploration.ipynb           | 354 +++++++++++++++++-
 us/states/sc/data_exploration_test.ipynb      | 179 ++++++++-
 us/states/sc/h4216_analysis_comparison.md     | 269 ++++++-------
 us/states/sc/pe_h4216_test_analysis.csv       |  16 +
 us/states/sc/sc_h4216_test_analysis.ipynb     | 188 +++++++++-
 .../sc/sc_test_dataset_summary_weighted.csv   |  22 ++
 6 files changed, 825 insertions(+), 203 deletions(-)
 create mode 100644 us/states/sc/pe_h4216_test_analysis.csv
 create mode 100644 us/states/sc/sc_test_dataset_summary_weighted.csv

diff --git a/us/states/sc/data_exploration.ipynb b/us/states/sc/data_exploration.ipynb
index b4ba407..e6978a6 100644
--- a/us/states/sc/data_exploration.ipynb
+++ b/us/states/sc/data_exploration.ipynb
@@ -34,45 +34,361 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {},
-   "outputs": [],
-   "source": "# Check dataset size - use .values to get raw arrays (avoid MicroSeries auto-weighting)\nhousehold_weight = sim.calculate(\"household_weight\", period=2025).values\nhousehold_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\").values\nperson_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\").values\n\n# Weighted sums using raw arrays\nweighted_household_count = (household_count * household_weight).sum()\nweighted_person_count = (person_count * household_weight).sum()\n\nprint(f\"Number of households in dataset: {len(household_weight):,}\")\nprint(f\"Household count (weighted): {weighted_household_count:,.0f}\")\nprint(f\"Person count (weighted): {weighted_person_count:,.0f}\")"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Number of households in dataset: 35,324\n",
+      "Household count (weighted): 1,887,388\n",
+      "Person count (weighted): 5,451,832\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check dataset size - use .values to get raw arrays (avoid MicroSeries auto-weighting)\n",
+    "household_weight = sim.calculate(\"household_weight\", period=2025).values\n",
+    "household_count = sim.calculate(\"household_count\", period=2025, map_to=\"household\").values\n",
+    "person_count = sim.calculate(\"person_count\", period=2025, map_to=\"household\").values\n",
+    "\n",
+    "# Weighted sums using raw arrays\n",
+    "weighted_household_count = (household_count * household_weight).sum()\n",
+    "weighted_person_count = (person_count * household_weight).sum()\n",
+    "\n",
+    "print(f\"Number of households in dataset: {len(household_weight):,}\")\n",
+    "print(f\"Household count (weighted): {weighted_household_count:,.0f}\")\n",
+    "print(f\"Person count (weighted): {weighted_person_count:,.0f}\")"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "metadata": {},
-   "outputs": [],
-   "source": "# Check income distribution (weighted vs unweighted, household and person level)\n# Use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)\nagi_hh_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\nhh_weights = sim.calculate(\"household_weight\", period=2025).values\n\nagi_person_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\").values\nperson_weights = sim.calculate(\"person_weight\", period=2025).values\n\n# Weighted percentile calculation\ndef weighted_percentile(values, weights, percentile):\n    sorted_indices = np.argsort(values)\n    sorted_values = values[sorted_indices]\n    sorted_weights = weights[sorted_indices]\n    cumulative_weight = np.cumsum(sorted_weights)\n    idx = np.searchsorted(cumulative_weight, cumulative_weight[-1] * percentile / 100)\n    return sorted_values[min(idx, len(sorted_values)-1)]\n\n# Unweighted medians\nunweighted_median_hh = np.median(agi_hh_array)\nunweighted_median_person = np.median(agi_person_array)\n\n# Weighted medians\nweighted_median_hh = weighted_percentile(agi_hh_array, hh_weights, 50)\nweighted_median_person = weighted_percentile(agi_person_array, person_weights, 50)\n\n# Weighted averages\nweighted_avg_hh = np.average(agi_hh_array, weights=hh_weights)\nweighted_avg_person = np.average(agi_person_array, weights=person_weights)\n\n# Average household size\ntotal_persons = person_weights.sum()\ntotal_households = hh_weights.sum()\navg_hh_size = total_persons / total_households\n\nprint(\"=\" * 60)\nprint(\"INCOME DISTRIBUTION SUMMARY\")\nprint(\"=\" * 60)\nprint(f\"\\nHousehold AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_hh:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_hh:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_hh:,.0f}\")\n\nprint(f\"\\nPerson AGI:\")\nprint(f\"  Unweighted median: ${unweighted_median_person:,.0f}\")\nprint(f\"  Weighted median:   ${weighted_median_person:,.0f}\")\nprint(f\"  Weighted average:  ${weighted_avg_person:,.0f}\")\n\nprint(f\"\\nAverage household size: {avg_hh_size:.1f}\")\n\nprint(f\"\\nWeighted household AGI percentiles:\")\nprint(f\"  25th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\")\nprint(f\"  50th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 50):,.0f}\")\nprint(f\"  75th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\")\nprint(f\"  90th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\")\nprint(f\"  95th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\")\nprint(f\"  Max AGI: ${agi_hh_array.max():,.0f}\")"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "============================================================\n",
+      "INCOME DISTRIBUTION SUMMARY\n",
+      "============================================================\n",
+      "\n",
+      "Household AGI:\n",
+      "  Unweighted median: $41,884\n",
+      "  Weighted median:   $43,222\n",
+      "  Weighted average:  $103,858\n",
+      "\n",
+      "Person AGI:\n",
+      "  Unweighted median: $40,216\n",
+      "  Weighted median:   $38,962\n",
+      "  Weighted average:  $93,926\n",
+      "\n",
+      "Average household size: 2.9\n",
+      "\n",
+      "Weighted household AGI percentiles:\n",
+      "  25th percentile: $9,425\n",
+      "  50th percentile: $43,222\n",
+      "  75th percentile: $91,877\n",
+      "  90th percentile: $167,068\n",
+      "  95th percentile: $268,311\n",
+      "  Max AGI: $6,430,892\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check income distribution (weighted vs unweighted, household and person level)\n",
+    "# Use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)\n",
+    "agi_hh_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\n",
+    "hh_weights = sim.calculate(\"household_weight\", period=2025).values\n",
+    "\n",
+    "agi_person_array = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"person\").values\n",
+    "person_weights = sim.calculate(\"person_weight\", period=2025).values\n",
+    "\n",
+    "# Weighted percentile calculation\n",
+    "def weighted_percentile(values, weights, percentile):\n",
+    "    sorted_indices = np.argsort(values)\n",
+    "    sorted_values = values[sorted_indices]\n",
+    "    sorted_weights = weights[sorted_indices]\n",
+    "    cumulative_weight = np.cumsum(sorted_weights)\n",
+    "    idx = np.searchsorted(cumulative_weight, cumulative_weight[-1] * percentile / 100)\n",
+    "    return sorted_values[min(idx, len(sorted_values)-1)]\n",
+    "\n",
+    "# Unweighted medians\n",
+    "unweighted_median_hh = np.median(agi_hh_array)\n",
+    "unweighted_median_person = np.median(agi_person_array)\n",
+    "\n",
+    "# Weighted medians\n",
+    "weighted_median_hh = weighted_percentile(agi_hh_array, hh_weights, 50)\n",
+    "weighted_median_person = weighted_percentile(agi_person_array, person_weights, 50)\n",
+    "\n",
+    "# Weighted averages\n",
+    "weighted_avg_hh = np.average(agi_hh_array, weights=hh_weights)\n",
+    "weighted_avg_person = np.average(agi_person_array, weights=person_weights)\n",
+    "\n",
+    "# Average household size\n",
+    "total_persons = person_weights.sum()\n",
+    "total_households = hh_weights.sum()\n",
+    "avg_hh_size = total_persons / total_households\n",
+    "\n",
+    "print(\"=\" * 60)\n",
+    "print(\"INCOME DISTRIBUTION SUMMARY\")\n",
+    "print(\"=\" * 60)\n",
+    "print(f\"\\nHousehold AGI:\")\n",
+    "print(f\"  Unweighted median: ${unweighted_median_hh:,.0f}\")\n",
+    "print(f\"  Weighted median:   ${weighted_median_hh:,.0f}\")\n",
+    "print(f\"  Weighted average:  ${weighted_avg_hh:,.0f}\")\n",
+    "\n",
+    "print(f\"\\nPerson AGI:\")\n",
+    "print(f\"  Unweighted median: ${unweighted_median_person:,.0f}\")\n",
+    "print(f\"  Weighted median:   ${weighted_median_person:,.0f}\")\n",
+    "print(f\"  Weighted average:  ${weighted_avg_person:,.0f}\")\n",
+    "\n",
+    "print(f\"\\nAverage household size: {avg_hh_size:.1f}\")\n",
+    "\n",
+    "print(f\"\\nWeighted household AGI percentiles:\")\n",
+    "print(f\"  25th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\")\n",
+    "print(f\"  50th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 50):,.0f}\")\n",
+    "print(f\"  75th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\")\n",
+    "print(f\"  90th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\")\n",
+    "print(f\"  95th percentile: ${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\")\n",
+    "print(f\"  Max AGI: ${agi_hh_array.max():,.0f}\")"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "metadata": {},
-   "outputs": [],
-   "source": "# Check households with children - use .values for raw arrays\nis_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\").values\nhousehold_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\").values\nhousehold_weight_person = sim.calculate(\"household_weight\", period=2025, map_to=\"person\").values\n\n# Create DataFrame\ndf_households = pd.DataFrame({\n    'household_id': household_id,\n    'is_child': is_child,\n    'household_weight': household_weight_person\n})\n\n# Count children per household\nchildren_per_household = df_households.groupby('household_id').agg({\n    'is_child': 'sum',\n    'household_weight': 'first'\n}).reset_index()\n\n# Calculate weighted household counts\ntotal_households_with_children = children_per_household[children_per_household['is_child'] > 0]['household_weight'].sum()\nhouseholds_with_1_child = children_per_household[children_per_household['is_child'] == 1]['household_weight'].sum()\nhouseholds_with_2_children = children_per_household[children_per_household['is_child'] == 2]['household_weight'].sum()\nhouseholds_with_3plus_children = children_per_household[children_per_household['is_child'] >= 3]['household_weight'].sum()\n\nprint(f\"\\nHouseholds with children (weighted):\")\nprint(f\"  Total households with children: {total_households_with_children:,.0f}\")\nprint(f\"  Households with 1 child: {households_with_1_child:,.0f}\")\nprint(f\"  Households with 2 children: {households_with_2_children:,.0f}\")\nprint(f\"  Households with 3+ children: {households_with_3plus_children:,.0f}\")"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Households with children (weighted):\n",
+      "  Total households with children: 598,564\n",
+      "  Households with 1 child: 247,956\n",
+      "  Households with 2 children: 190,545\n",
+      "  Households with 3+ children: 160,063\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check households with children - use .values for raw arrays\n",
+    "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\").values\n",
+    "household_id = sim.calculate(\"household_id\", period=2025, map_to=\"person\").values\n",
+    "household_weight_person = sim.calculate(\"household_weight\", period=2025, map_to=\"person\").values\n",
+    "\n",
+    "# Create DataFrame\n",
+    "df_households = pd.DataFrame({\n",
+    "    'household_id': household_id,\n",
+    "    'is_child': is_child,\n",
+    "    'household_weight': household_weight_person\n",
+    "})\n",
+    "\n",
+    "# Count children per household\n",
+    "children_per_household = df_households.groupby('household_id').agg({\n",
+    "    'is_child': 'sum',\n",
+    "    'household_weight': 'first'\n",
+    "}).reset_index()\n",
+    "\n",
+    "# Calculate weighted household counts\n",
+    "total_households_with_children = children_per_household[children_per_household['is_child'] > 0]['household_weight'].sum()\n",
+    "households_with_1_child = children_per_household[children_per_household['is_child'] == 1]['household_weight'].sum()\n",
+    "households_with_2_children = children_per_household[children_per_household['is_child'] == 2]['household_weight'].sum()\n",
+    "households_with_3plus_children = children_per_household[children_per_household['is_child'] >= 3]['household_weight'].sum()\n",
+    "\n",
+    "print(f\"\\nHouseholds with children (weighted):\")\n",
+    "print(f\"  Total households with children: {total_households_with_children:,.0f}\")\n",
+    "print(f\"  Households with 1 child: {households_with_1_child:,.0f}\")\n",
+    "print(f\"  Households with 2 children: {households_with_2_children:,.0f}\")\n",
+    "print(f\"  Households with 3+ children: {households_with_3plus_children:,.0f}\")"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "metadata": {},
-   "outputs": [],
-   "source": "# Check children by age groups - use .values for raw arrays\ndf = pd.DataFrame({\n    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\").values,\n    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\").values,\n    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\").values,\n    \"age\": sim.calculate(\"age\", map_to=\"person\").values,\n    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\").values\n})\n\n# Filter for children and apply weights\nchildren_under_18_df = df[df['age'] < 18]\nchildren_under_6_df = df[df['age'] < 6]\nchildren_under_3_df = df[df['age'] < 3]\n\n# Calculate weighted totals\ntotal_children = children_under_18_df['person_weight'].sum()\nchildren_under_6 = children_under_6_df['person_weight'].sum()\nchildren_under_3 = children_under_3_df['person_weight'].sum()\n\nprint(f\"\\nChildren by age:\")\nprint(f\"  Total children under 18: {total_children:,.0f}\")\nprint(f\"  Children under 6: {children_under_6:,.0f}\")\nprint(f\"  Children under 3: {children_under_3:,.0f}\")"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Children by age:\n",
+      "  Total children under 18: 1,198,147\n",
+      "  Children under 6: 349,101\n",
+      "  Children under 3: 169,412\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Check children by age groups - use .values for raw arrays\n",
+    "df = pd.DataFrame({\n",
+    "    \"household_id\": sim.calculate(\"household_id\", map_to=\"person\").values,\n",
+    "    \"tax_unit_id\": sim.calculate(\"tax_unit_id\", map_to=\"person\").values,\n",
+    "    \"person_id\": sim.calculate(\"person_id\", map_to=\"person\").values,\n",
+    "    \"age\": sim.calculate(\"age\", map_to=\"person\").values,\n",
+    "    \"person_weight\": sim.calculate(\"person_weight\", map_to=\"person\").values\n",
+    "})\n",
+    "\n",
+    "# Filter for children and apply weights\n",
+    "children_under_18_df = df[df['age'] < 18]\n",
+    "children_under_6_df = df[df['age'] < 6]\n",
+    "children_under_3_df = df[df['age'] < 3]\n",
+    "\n",
+    "# Calculate weighted totals\n",
+    "total_children = children_under_18_df['person_weight'].sum()\n",
+    "children_under_6 = children_under_6_df['person_weight'].sum()\n",
+    "children_under_3 = children_under_3_df['person_weight'].sum()\n",
+    "\n",
+    "print(f\"\\nChildren by age:\")\n",
+    "print(f\"  Total children under 18: {total_children:,.0f}\")\n",
+    "print(f\"  Children under 6: {children_under_6:,.0f}\")\n",
+    "print(f\"  Children under 3: {children_under_3:,.0f}\")"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "metadata": {},
-   "outputs": [],
-   "source": "# Create comprehensive summary table\nsummary_data = {\n    'Metric': [\n        'Household count (weighted)',\n        'Person count (weighted)',\n        'Average household size',\n        'Weighted median household AGI',\n        'Weighted average household AGI',\n        'Weighted median person AGI',\n        'Weighted average person AGI',\n        'Unweighted median household AGI',\n        'Unweighted median person AGI',\n        '25th percentile household AGI',\n        '75th percentile household AGI',\n        '90th percentile household AGI',\n        '95th percentile household AGI',\n        'Max household AGI',\n        'Total households with children',\n        'Households with 1 child',\n        'Households with 2 children',\n        'Households with 3+ children',\n        'Total children under 18',\n        'Children under 6',\n        'Children under 3'\n    ],\n    'Value': [\n        f\"{weighted_household_count:,.0f}\",\n        f\"{weighted_person_count:,.0f}\",\n        f\"{avg_hh_size:.1f}\",\n        f\"${weighted_median_hh:,.0f}\",\n        f\"${weighted_avg_hh:,.0f}\",\n        f\"${weighted_median_person:,.0f}\",\n        f\"${weighted_avg_person:,.0f}\",\n        f\"${unweighted_median_hh:,.0f}\",\n        f\"${unweighted_median_person:,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\",\n        f\"${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\",\n        f\"${agi_hh_array.max():,.0f}\",\n        f\"{total_households_with_children:,.0f}\",\n        f\"{households_with_1_child:,.0f}\",\n        f\"{households_with_2_children:,.0f}\",\n        f\"{households_with_3plus_children:,.0f}\",\n        f\"{total_children:,.0f}\",\n        f\"{children_under_6:,.0f}\",\n        f\"{children_under_3:,.0f}\"\n    ]\n}\n\nsummary_df = pd.DataFrame(summary_data)\n\nprint(\"\\n\" + \"=\"*65)\nprint(\"SC DATASET SUMMARY - WEIGHTED (Population Estimates)\")\nprint(\"=\"*65)\nprint(summary_df.to_string(index=False))\nprint(\"=\"*65)\n\n# Save table\nsummary_df.to_csv('sc_dataset_summary_weighted.csv', index=False)\nprint(\"\\nSummary saved to: sc_dataset_summary_weighted.csv\")"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "=================================================================\n",
+      "SC DATASET SUMMARY - WEIGHTED (Population Estimates)\n",
+      "=================================================================\n",
+      "                         Metric      Value\n",
+      "     Household count (weighted)  1,887,388\n",
+      "        Person count (weighted)  5,451,832\n",
+      "         Average household size        2.9\n",
+      "  Weighted median household AGI    $43,222\n",
+      " Weighted average household AGI   $103,858\n",
+      "     Weighted median person AGI    $38,962\n",
+      "    Weighted average person AGI    $93,926\n",
+      "Unweighted median household AGI    $41,884\n",
+      "   Unweighted median person AGI    $40,216\n",
+      "  25th percentile household AGI     $9,425\n",
+      "  75th percentile household AGI    $91,877\n",
+      "  90th percentile household AGI   $167,068\n",
+      "  95th percentile household AGI   $268,311\n",
+      "              Max household AGI $6,430,892\n",
+      " Total households with children    598,564\n",
+      "        Households with 1 child    247,956\n",
+      "     Households with 2 children    190,545\n",
+      "    Households with 3+ children    160,063\n",
+      "        Total children under 18  1,198,147\n",
+      "               Children under 6    349,101\n",
+      "               Children under 3    169,412\n",
+      "=================================================================\n",
+      "\n",
+      "Summary saved to: sc_dataset_summary_weighted.csv\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Create comprehensive summary table\n",
+    "summary_data = {\n",
+    "    'Metric': [\n",
+    "        'Household count (weighted)',\n",
+    "        'Person count (weighted)',\n",
+    "        'Average household size',\n",
+    "        'Weighted median household AGI',\n",
+    "        'Weighted average household AGI',\n",
+    "        'Weighted median person AGI',\n",
+    "        'Weighted average person AGI',\n",
+    "        'Unweighted median household AGI',\n",
+    "        'Unweighted median person AGI',\n",
+    "        '25th percentile household AGI',\n",
+    "        '75th percentile household AGI',\n",
+    "        '90th percentile household AGI',\n",
+    "        '95th percentile household AGI',\n",
+    "        'Max household AGI',\n",
+    "        'Total households with children',\n",
+    "        'Households with 1 child',\n",
+    "        'Households with 2 children',\n",
+    "        'Households with 3+ children',\n",
+    "        'Total children under 18',\n",
+    "        'Children under 6',\n",
+    "        'Children under 3'\n",
+    "    ],\n",
+    "    'Value': [\n",
+    "        f\"{weighted_household_count:,.0f}\",\n",
+    "        f\"{weighted_person_count:,.0f}\",\n",
+    "        f\"{avg_hh_size:.1f}\",\n",
+    "        f\"${weighted_median_hh:,.0f}\",\n",
+    "        f\"${weighted_avg_hh:,.0f}\",\n",
+    "        f\"${weighted_median_person:,.0f}\",\n",
+    "        f\"${weighted_avg_person:,.0f}\",\n",
+    "        f\"${unweighted_median_hh:,.0f}\",\n",
+    "        f\"${unweighted_median_person:,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 25):,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 75):,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 90):,.0f}\",\n",
+    "        f\"${weighted_percentile(agi_hh_array, hh_weights, 95):,.0f}\",\n",
+    "        f\"${agi_hh_array.max():,.0f}\",\n",
+    "        f\"{total_households_with_children:,.0f}\",\n",
+    "        f\"{households_with_1_child:,.0f}\",\n",
+    "        f\"{households_with_2_children:,.0f}\",\n",
+    "        f\"{households_with_3plus_children:,.0f}\",\n",
+    "        f\"{total_children:,.0f}\",\n",
+    "        f\"{children_under_6:,.0f}\",\n",
+    "        f\"{children_under_3:,.0f}\"\n",
+    "    ]\n",
+    "}\n",
+    "\n",
+    "summary_df = pd.DataFrame(summary_data)\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*65)\n",
+    "print(\"SC DATASET SUMMARY - WEIGHTED (Population Estimates)\")\n",
+    "print(\"=\"*65)\n",
+    "print(summary_df.to_string(index=False))\n",
+    "print(\"=\"*65)\n",
+    "\n",
+    "# Save table\n",
+    "summary_df.to_csv('sc_dataset_summary_weighted.csv', index=False)\n",
+    "print(\"\\nSummary saved to: sc_dataset_summary_weighted.csv\")"
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 8,
    "metadata": {},
-   "outputs": [],
-   "source": "# Households with $0 income - using raw arrays\nagi_hh = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\nweights = sim.calculate(\"household_weight\", period=2025).values\n\nzero_income_mask = agi_hh == 0\nzero_income_count = weights[zero_income_mask].sum()\ntotal_households = weights.sum()\n\nprint(\"\\n\" + \"=\"*70)\nprint(\"HOUSEHOLDS WITH $0 INCOME\")\nprint(\"=\"*70)\nprint(f\"Household count: {zero_income_count:,.0f}\")\nprint(f\"Percentage of all households: {zero_income_count / total_households * 100:.2f}%\")\nprint(\"=\"*70)"
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLDS WITH $0 INCOME\n",
+      "======================================================================\n",
+      "Household count: 179,119\n",
+      "Percentage of all households: 9.49%\n",
+      "======================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Households with $0 income - using raw arrays\n",
+    "agi_hh = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\n",
+    "weights = sim.calculate(\"household_weight\", period=2025).values\n",
+    "\n",
+    "zero_income_mask = agi_hh == 0\n",
+    "zero_income_count = weights[zero_income_mask].sum()\n",
+    "total_households = weights.sum()\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*70)\n",
+    "print(\"HOUSEHOLDS WITH $0 INCOME\")\n",
+    "print(\"=\"*70)\n",
+    "print(f\"Household count: {zero_income_count:,.0f}\")\n",
+    "print(f\"Percentage of all households: {zero_income_count / total_households * 100:.2f}%\")\n",
+    "print(\"=\"*70)"
+   ]
   },
   {
    "cell_type": "code",
@@ -160,4 +476,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 4
-}
\ No newline at end of file
+}
diff --git a/us/states/sc/data_exploration_test.ipynb b/us/states/sc/data_exploration_test.ipynb
index 938545d..7f6b103 100644
--- a/us/states/sc/data_exploration_test.ipynb
+++ b/us/states/sc/data_exploration_test.ipynb
@@ -12,7 +12,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "id": "cell-1",
    "metadata": {},
    "outputs": [],
@@ -26,7 +26,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "id": "cell-2",
    "metadata": {},
    "outputs": [],
@@ -37,10 +37,20 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "id": "cell-3",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Number of households in dataset: 31,322\n",
+      "Household count (weighted): 1,844,111\n",
+      "Person count (weighted): 5,389,226\n"
+     ]
+    }
+   ],
    "source": [
     "# Check dataset size - use .values to get raw arrays (avoid MicroSeries auto-weighting)\n",
     "household_weight = sim.calculate(\"household_weight\", period=2025).values\n",
@@ -58,10 +68,40 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "id": "cell-4",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "============================================================\n",
+      "INCOME DISTRIBUTION SUMMARY\n",
+      "============================================================\n",
+      "\n",
+      "Household AGI:\n",
+      "  Unweighted median: $57,308\n",
+      "  Weighted median:   $34,927\n",
+      "  Weighted average:  $74,061\n",
+      "\n",
+      "Person AGI:\n",
+      "  Unweighted median: $58,750\n",
+      "  Weighted median:   $34,911\n",
+      "  Weighted average:  $78,962\n",
+      "\n",
+      "Average household size: 2.9\n",
+      "\n",
+      "Weighted household AGI percentiles:\n",
+      "  25th percentile: $2,489\n",
+      "  50th percentile: $34,927\n",
+      "  75th percentile: $86,301\n",
+      "  90th percentile: $140,239\n",
+      "  95th percentile: $236,759\n",
+      "  Max AGI: $418,650,960\n"
+     ]
+    }
+   ],
    "source": [
     "# Check income distribution (weighted vs unweighted, household and person level)\n",
     "# Use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)\n",
@@ -123,10 +163,23 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "id": "cell-5",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Households with children (weighted):\n",
+      "  Total households with children: 663,513\n",
+      "  Households with 1 child: 303,647\n",
+      "  Households with 2 children: 209,804\n",
+      "  Households with 3+ children: 150,062\n"
+     ]
+    }
+   ],
    "source": [
     "# Check households with children - use .values for raw arrays\n",
     "is_child = sim.calculate(\"is_child\", period=2025, map_to=\"person\").values\n",
@@ -161,10 +214,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "id": "cell-6",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Children by age:\n",
+      "  Total children under 18: 1,247,050\n",
+      "  Children under 6: 361,890\n",
+      "  Children under 3: 177,869\n"
+     ]
+    }
+   ],
    "source": [
     "# Check children by age groups - use .values for raw arrays\n",
     "df = pd.DataFrame({\n",
@@ -193,10 +258,46 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "id": "cell-7",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "=================================================================\n",
+      "SC TEST DATASET SUMMARY - WEIGHTED (Population Estimates)\n",
+      "=================================================================\n",
+      "                         Metric        Value\n",
+      "     Household count (weighted)    1,844,111\n",
+      "        Person count (weighted)    5,389,226\n",
+      "         Average household size          2.9\n",
+      "  Weighted median household AGI      $34,927\n",
+      " Weighted average household AGI      $74,061\n",
+      "     Weighted median person AGI      $34,911\n",
+      "    Weighted average person AGI      $78,962\n",
+      "Unweighted median household AGI      $57,308\n",
+      "   Unweighted median person AGI      $58,750\n",
+      "  25th percentile household AGI       $2,489\n",
+      "  75th percentile household AGI      $86,301\n",
+      "  90th percentile household AGI     $140,239\n",
+      "  95th percentile household AGI     $236,759\n",
+      "              Max household AGI $418,650,960\n",
+      " Total households with children      663,513\n",
+      "        Households with 1 child      303,647\n",
+      "     Households with 2 children      209,804\n",
+      "    Households with 3+ children      150,062\n",
+      "        Total children under 18    1,247,050\n",
+      "               Children under 6      361,890\n",
+      "               Children under 3      177,869\n",
+      "=================================================================\n",
+      "\n",
+      "Summary saved to: sc_test_dataset_summary_weighted.csv\n"
+     ]
+    }
+   ],
    "source": [
     "# Create comprehensive summary table\n",
     "summary_data = {\n",
@@ -263,10 +364,24 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 8,
    "id": "cell-8",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLDS WITH $0 INCOME\n",
+      "======================================================================\n",
+      "Household count: 227,976\n",
+      "Percentage of all households: 12.36%\n",
+      "======================================================================\n"
+     ]
+    }
+   ],
    "source": [
     "# Households with $0 income - using raw arrays\n",
     "agi_hh = sim.calculate(\"adjusted_gross_income\", period=2025, map_to=\"household\").values\n",
@@ -286,10 +401,32 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 9,
    "id": "cell-9",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "======================================================================\n",
+      "HOUSEHOLD COUNTS BY INCOME BRACKET\n",
+      "======================================================================\n",
+      "Income Bracket Households % of All Households\n",
+      "       $0-$10k    553,836              30.03%\n",
+      "     $10k-$20k    158,183               8.58%\n",
+      "     $20k-$30k    131,263               7.12%\n",
+      "     $30k-$40k    113,749               6.17%\n",
+      "     $40k-$50k    101,002               5.48%\n",
+      "     $50k-$60k     98,917               5.36%\n",
+      "======================================================================\n",
+      "\n",
+      "Total households in $0-$60k range: 1,156,950\n",
+      "Percentage of all households in $0-$60k range: 62.74%\n"
+     ]
+    }
+   ],
    "source": [
     "# Household counts by income brackets\n",
     "income_brackets = [\n",
@@ -335,8 +472,16 @@
    "name": "python3"
   },
   "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
    "name": "python",
-   "version": "3.11.0"
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
   }
  },
  "nbformat": 4,
diff --git a/us/states/sc/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis_comparison.md
index d4a235a..3728b32 100644
--- a/us/states/sc/h4216_analysis_comparison.md
+++ b/us/states/sc/h4216_analysis_comparison.md
@@ -2,198 +2,173 @@
 
 ## Executive Summary
 
-**UPDATE (Feb 2025):** PR #7514 fixed a bug where `sc_additions` (QBI and SALT addbacks) were incorrectly applied under H.4216. Since H.4216 starts from AGI (before federal deductions), addbacks are inappropriate. With this fix, PolicyEngine estimates approximately **-$110.9M** vs RFA's **-$119.1M** (~93% accuracy).
+**UPDATE (March 2025):** After PR #7514 fix and testing multiple datasets:
+
+| Dataset | 5.21% Impact | vs RFA (-$309M) | 5.39% Impact | vs RFA (-$119M) |
+|---------|--------------|-----------------|--------------|-----------------|
+| **Production** | -$393M | 73% accuracy | -$198M | 34% accuracy |
+| **Test (Mar)** | -$212M | 69% accuracy | -$93M | 78% accuracy |
+| **RFA** | -$309M | - | -$119M | - |
+
+**Key Finding:** Neither dataset consistently matches RFA. Production overestimates cuts, Test underestimates them. The core issue is baseline revenue calibration.
 
 ---
 
-### Original Analysis (Pre-Fix)
+## Dataset Comparison
 
-The original $159M difference between PolicyEngine (+$39.8M) and RFA (-$119.1M) was driven by:
-1. **Bug**: `sc_additions` were being applied when starting from AGI (fixed in PR #7514)
-2. **Different income distributions** in the underlying data
+### Overview
 
-## Summary
-
-| Metric | RFA | PolicyEngine | Difference |
-|--------|-----|--------------|------------|
-| **General Fund Impact** | **-$119.1M** | **+$39.8M** | **+$158.9M** |
-| Total Returns | 2,757,573 | 2,935,621 | +178,048 |
-| Tax Decrease % | 38.7% | 20.0% | -18.7pp |
-| Tax Increase % | 26.7% | 24.0% | -2.7pp |
-| No Change % | 34.6% | 56.0% | +21.4pp |
+| Metric | Production | Test | RFA |
+|--------|------------|------|-----|
+| **Tax Units** | 2,935,621 | 2,705,850 | 2,757,573 |
+| **Baseline Revenue** | $6.5B | $4.0B | ~$6.4B |
+| **Median HH AGI** | $43,222 | $34,927 | N/A |
+| **Avg HH AGI** | $103,858 | $74,061 | N/A |
+| **25th Percentile AGI** | $9,425 | $2,489 | N/A |
+| **Max AGI** | $6.4M | $418.7M | N/A |
 
-## Top 5 Discrepancies by Income Bracket
+### Budget Impact Comparison
 
-| AGI Range | RFA Impact | PE Impact | Difference |
-|-----------|------------|-----------|------------|
-| Over $1,000,000 | -$13.8M | -$115.3M | -$101.5M |
-| $50,001-$75,000 | -$82.1M | -$23.3M | +$58.9M |
-| $100,001-$150,000 | +$3.1M | +$53.4M | +$50.3M |
-| $300,001-$500,000 | -$4.6M | +$40.6M | +$45.3M |
-| $500,001-$1,000,000 | -$16.2M | +$18.7M | +$34.9M |
+| Rate | Production | Test | RFA | Best Match |
+|------|------------|------|-----|------------|
+| **5.21%** | -$393M | -$212M | -$309M | Production (73%) |
+| **5.39%** | -$198M | -$93M | -$119M | Test (78%) |
 
-## Key Differences Explaining the $159M Gap
+---
 
-### 1. Upper-Middle Income ($100k-$500k): PE Shows Much Larger Tax Increases
+## Why Production OVERESTIMATES
 
-| Bracket | RFA Avg Change | PE Avg Change | Direction |
-|---------|----------------|---------------|-----------|
-| $100k-$150k | +$11 | +$284 | Both increase, PE 25x larger |
-| $150k-$200k | +$355 | +$727 | Both increase, PE 2x larger |
-| $300k-$500k | **-$82** | **+$1,099** | RFA: decrease, PE: increase |
-| $500k-$1M | **-$631** | **+$1,129** | RFA: decrease, PE: increase |
+Production estimates -$198M vs RFA's -$119M at 5.39% rate (**67% over**)
 
-**This is the primary driver of the difference.** PolicyEngine shows significant tax INCREASES in the $100k-$500k range where RFA shows small increases or even decreases.
+### 1. Higher Average Incomes
+- Production median AGI: **$43,222** vs Test $34,927
+- Production avg AGI: **$103,858** vs Test $74,061
+- More high earners = larger tax cuts when rates drop
 
-### 2. Middle Income ($30k-$100k): PE Shows Smaller Tax Cuts
+### 2. Higher Baseline Revenue
+- Production: **$6.5B** baseline revenue
+- Test: $4.0B baseline revenue
+- Production has **63% more** baseline revenue than Test
+- Bigger revenue base = bigger absolute cuts
 
-| Bracket | RFA Avg Change | PE Avg Change |
-|---------|----------------|---------------|
-| $30k-$40k | -$72 | -$23 |
-| $40k-$50k | -$179 | -$135 |
-| $50k-$75k | -$202 | -$77 |
-| $75k-$100k | -$146 | -$71 |
+### 3. More Tax Units Than RFA
+- Production: 2,935,621 tax units
+- RFA: 2,757,573 filers
+- **+178,048 extra units** (6.5% more)
+- Includes non-filers with imputed income
 
-RFA shows 2-3x larger tax cuts in these brackets.
+### 4. Fewer Low-Income Units
+- Production 25th percentile: **$9,425**
+- Test 25th percentile: $2,489
+- Production has fewer truly low-income/zero-tax units
+- More taxpayers affected by rate changes
 
-### 3. Over $1M: PE Shows Much Larger Tax Cuts
+---
 
-| Metric | RFA | PE |
-|--------|-----|-----|
-| Avg Change | -$1,154 | -$5,082 |
-| Total Impact | -$13.8M | -$115.3M |
+## Why Test UNDERESTIMATES
 
-PE shows 4-8x larger tax cuts for millionaires, but with more returns (22,686 vs 11,936).
+Test estimates -$93M vs RFA's -$119M at 5.39% rate (**22% under**)
 
-### 4. Low Income ($0-$30k): Different Tax Bases
+### 1. Lower Baseline Revenue
+- Test: **$4.0B** baseline revenue
+- RFA: ~$6.4B estimated baseline
+- Test has **37% less** revenue than RFA
+- Smaller revenue base = smaller absolute cuts
 
-RFA shows existing tax liability for low-income filers ($50, $3, $16, $107 avg), while PE shows $0 for most low-income brackets. This suggests:
-- Different baseline calculations
-- Different treatment of non-filers
-- CPS data may underrepresent low-income tax filers
+### 2. Lower Average Incomes
+- Test avg AGI: **$74,061** vs Production $103,858
+- Fewer high-income taxpayers paying significant taxes
+- Smaller tax liabilities to cut
 
-## Return Count Comparison (Key Finding)
+### 3. Extreme Outlier at Top
+- Test max AGI: **$418.7M** (single household)
+- Production max: $6.4M
+- One extreme outlier may distort millionaire calculations
+- Could skew average tax calculations
 
-| AGI Range | RFA Returns | PE Returns | PE/RFA Ratio |
-|-----------|-------------|------------|--------------|
-| $0* | 78,854 | 619,009 | **7.85x** |
-| $1-$10k | 286,253 | 502,276 | 1.75x |
-| $10k-$20k | 310,122 | 279,412 | 0.90x |
-| $20k-$30k | 275,560 | 252,862 | 0.92x |
-| $30k-$40k | 269,566 | 215,980 | 0.80x |
-| $40k-$50k | 234,386 | 197,525 | 0.84x |
-| $50k-$75k | 407,593 | 300,857 | **0.74x** |
-| $75k-$100k | 250,437 | 177,284 | **0.71x** |
-| $100k-$150k | 298,343 | 187,945 | **0.63x** |
-| $150k-$200k | 143,398 | 73,396 | **0.51x** |
-| $200k-$300k | 109,340 | 52,882 | **0.48x** |
-| $300k-$500k | 56,123 | 36,977 | 0.66x |
-| $500k-$1M | 25,664 | 16,525 | 0.64x |
-| Over $1M | 11,936 | 22,686 | **1.90x** |
-| **Total** | **2,757,573** | **2,935,621** | 1.06x |
+### 4. More Low-Income Units
+- Test 25th percentile AGI: **$2,489**
+- Production 25th percentile: $9,425
+- More zero-tax units diluting the weighted averages
+- More units unaffected by rate changes
 
-**Key observations:**
-- PE has **7.85x more** $0 income returns - **PE counts all tax units (including non-filers), RFA only counts actual filers**
-- PE has **~50% fewer** returns in $100k-$300k brackets
-- PE has **1.9x more** millionaire returns
+---
+
+## The Core Issue: Baseline Revenue Calibration
 
-**Important note:** RFA uses actual SC tax return data (filers only). PolicyEngine uses CPS-based data representing all tax units regardless of filing status. This explains the large discrepancy in low-income brackets where many households don't file.
+| Source | Baseline Revenue | vs RFA |
+|--------|------------------|--------|
+| **RFA** | ~$6.4B | - |
+| **Production** | $6.5B | **+2%** |
+| **Test** | $4.0B | **-37%** |
 
-## Baseline Tax Liability Comparison
+### What Each Dataset Gets Right/Wrong
 
-| AGI Range | RFA Avg Tax | PE Avg Tax | Difference |
-|-----------|-------------|------------|------------|
-| $0-$10k | $3-$50 | $0 | PE shows no tax |
-| $50k-$75k | $1,192 | $822 | PE 31% lower |
-| $100k-$150k | $3,258 | $3,292 | Similar |
-| Over $1M | $78,228 | **$139,623** | PE **78% higher** |
+**Production Dataset:**
+- ✅ Matches RFA baseline revenue (~$6.5B)
+- ❌ Wrong income distribution (too many high earners)
+- ❌ Overestimates tax cuts at all rates
 
-## Total Baseline Revenue Comparison
+**Test Dataset:**
+- ✅ Better return count (2.71M vs 2.76M RFA)
+- ❌ Severely underestimates baseline revenue ($4B vs $6.4B)
+- ❌ Underestimates tax cuts at all rates
 
-| Bracket | RFA Revenue | PE Revenue | Difference |
-|---------|-------------|------------|------------|
-| $0-$100k | $1.24B | $0.74B | -$0.50B |
-| $100k-$1M | $4.22B | $2.61B | -$1.61B |
-| Over $1M | $0.93B | **$3.17B** | **+$2.23B** |
-| **Total** | **$6.40B** | **$6.52B** | +$0.12B (+1.8%) |
+### Ideal Dataset Would Have:
+- Test's return count (~2.7M matching RFA's 2.76M filers)
+- Production's baseline revenue (~$6.5B matching RFA's ~$6.4B)
+- RFA's millionaire distribution (11,936 returns over $1M)
 
-**Critical insight:** Total baseline revenue is similar, but PE derives **48%** of SC income tax from millionaires vs RFA's **15%**.
+---
 
-## Likely Causes
+## Technical Details
 
-### 1. Implementation Details (from PR #7494)
+### PR #7514 Fix (February 2025)
+
+Fixed bug where `sc_additions` (QBI and SALT addbacks) were incorrectly applied under H.4216. Since H.4216 starts from AGI (before federal deductions), addbacks are inappropriate.
+
+**Before fix:** +$39.8M (wrong direction)
+**After fix:** -$93M to -$198M depending on dataset
+
+### H.4216 Reform Structure
 
 **Baseline SC Taxable Income:**
-```python
+```
 taxable_income = federal_taxable_income + sc_additions - sc_subtractions
 ```
-Where `federal_taxable_income` = AGI - standard/itemized deduction - QBI deduction
 
 **H.4216 SC Taxable Income:**
-```python
-taxable_income = AGI + sc_additions - sc_subtractions - SCIAD
 ```
-Where SCIAD phases out from $40k-$190k AGI (varies by filing status)
+taxable_income = AGI - sc_subtractions - SCIAD
+```
 
-**Key Insight**: The reform switches from using federal taxable income (after federal deductions) to using AGI minus SCIAD. For taxpayers who itemize large deductions or have QBI deductions, this could result in HIGHER taxable income under H.4216.
+**Rate Structure:**
+- Current: 0% up to $3,640, 3% $3,640-$18,230, 6% over $18,230
+- H.4216: 1.99% up to $30,000, 5.21%/5.39% over $30,000
 
-### 2. SCIAD Phase-out Creates Winners and Losers
+### SCIAD Phase-out
 
-| Filing Status | SCIAD Amount | Phase-out Start | Phase-out End |
-|---------------|--------------|-----------------|---------------|
+| Filing Status | Amount | Phase-out Start | Phase-out End |
+|---------------|--------|-----------------|---------------|
 | Single | $15,000 | $40,000 | $95,000 |
 | MFJ | $30,000 | $80,000 | $190,000 |
 | HoH | $22,500 | $60,000 | $142,500 |
 
-For taxpayers above phase-out thresholds with SCIAD = $0:
-- If their federal deduction was > $0, they lose that deduction entirely
-- This explains why PE shows large tax INCREASES for $100k-$500k brackets
-
-### 3. Baseline Tax Differences
-PE baseline avg tax ($2,220) is lower than RFA ($2,321), suggesting different starting points for current law calculations.
-
-### 4. Data Source Differences
-- **RFA**: SC Department of Revenue 2024 tax returns (95% sample, inflated to 100%)
-- **PE**: CPS-based synthetic data for South Carolina
-
-Tax return data captures actual filers with precise income/deduction information. CPS-based data may:
-- Over/underrepresent certain income groups
-- Miss nuances in itemized vs standard deduction usage
-- Have different filing status distributions
-
-### 5. Federal Deduction Treatment
-H.4216 eliminates federal standard/itemized deductions. The impact depends heavily on:
-- Current deduction amounts by income level
-- How many taxpayers itemize vs take standard deduction
-- QBI deduction amounts (not replaced by SCIAD)
-
-RFA has actual deduction data; PE estimates from CPS.
-
-## Net Effect
-
-The $159M difference primarily comes from:
-1. **+$140M**: PE shows larger tax increases in $100k-$500k brackets
-2. **+$59M**: PE shows smaller tax cuts in $30k-$100k brackets
-3. **-$102M**: PE shows larger tax cuts for over $1M bracket
-4. **+$60M**: Various other bracket differences
-
-**Bottom line**: PolicyEngine's model shows the SCIAD phase-out creating more tax increases for upper-middle income taxpayers than RFA estimates, which more than offsets the tax cuts elsewhere.
-
-## Conclusion
-
-The $159M difference is **not primarily a calculation issue** but stems from:
-
-1. **Different populations**: PE counts all tax units (filers + non-filers), RFA counts only actual filers. This explains 540k extra returns in the $0 bracket.
-
-2. **Different income distributions**: PE's CPS-based data has far more millionaires (22.7k vs 12k) paying much higher average taxes ($140k vs $78k)
+---
 
-3. **Different return counts**: PE undercounts middle-income filers ($50k-$300k) by 40-50%
+## Recommendations
 
-4. **Millionaire impact drives divergence**: H.4216 gives large tax cuts to millionaires. With PE having 2x more millionaires paying 2x higher taxes, the reform's impact on this group dominates.
+### For Data Team:
+1. Investigate why Test dataset has only $4B baseline revenue vs $6.4B actual
+2. Recalibrate weights to match SC tax filer distribution
+3. Validate millionaire counts against IRS SOI data
 
-### Recommendation
+### For Analysis:
+1. Use Production for directional analysis (correct baseline revenue)
+2. Use Test for return count validation (closer to RFA filer count)
+3. Report range of estimates: -$93M to -$198M for 5.39% rate
 
-To align with RFA, PolicyEngine would need to:
-- Recalibrate SC state weights to match actual tax return distributions
-- Validate millionaire counts and income levels against IRS SOI data
-- Investigate why baseline tax for millionaires is so much higher than RFA
+### For Reporting:
+- RFA 5.39% estimate: **-$119.1M**
+- RFA 5.21% estimate: **-$309.0M**
+- PE best estimates: **-$93M to -$198M** (5.39%), **-$212M to -$393M** (5.21%)
diff --git a/us/states/sc/pe_h4216_test_analysis.csv b/us/states/sc/pe_h4216_test_analysis.csv
new file mode 100644
index 0000000..30e7d02
--- /dev/null
+++ b/us/states/sc/pe_h4216_test_analysis.csv
@@ -0,0 +1,16 @@
+Federal AGI Range,Est # Returns,Est % Returns,Old Avg Tax Liability,New Avg Tax Liability,Returns with Tax Change,% Returns in Range with Change,Old Avg Tax (Changed),New Avg Tax (Changed),Avg Tax Change,Total Dollar Change,Tax Decrease # Returns,Tax Decrease % in Range,Total Decrease Amount,Avg Decrease Amount,Tax Increase # Returns,Tax Increase % in Range,Total Increase Amount,Avg Increase Amount,No Tax Change # Returns,No Change % Returns,Zero Tax # Returns,Zero Tax % Returns
+$0*,727881,26.9%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,727881,100.0%,727881,100.0%
+$1 to $10000,498186,18.4%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,498186,100.0%,498186,100.0%
+$10001 to $20000,233000,8.6%,$0,$4,16527,7.1%,$0,$51,$51,$847688,0,0.0%,$0,$0,16527,7.1%,$847510,$51,216473,92.9%,215471,92.5%
+$20001 to $30000,171515,6.3%,$40,$56,48979,28.6%,$131,$187,$56,$2756262,2691,1.6%,$-22726,$-8,46288,27.0%,$2778858,$60,122536,71.4%,121168,70.6%
+$30001 to $40000,157010,5.8%,$149,$135,70118,44.7%,$333,$302,$-31,$-2140517,45821,29.2%,$-3836658,$-84,24298,15.5%,$1696106,$70,86892,55.3%,86762,55.3%
+$40001 to $50000,132402,4.9%,$399,$302,95777,72.3%,$548,$414,$-134,$-12807614,49802,37.6%,$-16610524,$-334,45975,34.7%,$3801858,$83,36624,27.7%,35193,26.6%
+$50001 to $75000,245406,9.1%,$701,$584,205399,83.7%,$836,$697,$-139,$-28577564,139789,57.0%,$-38644192,$-276,65610,26.7%,$10066116,$153,40008,16.3%,39028,15.9%
+$75001 to $100000,165713,6.1%,$1452,$1290,163884,98.9%,$1468,$1305,$-163,$-26753744,118394,71.4%,$-40121352,$-339,45491,27.5%,$13367631,$294,1829,1.1%,1759,1.1%
+$100001 to $150000,225396,8.3%,$2929,$3149,220578,97.9%,$2991,$3216,$225,$49609656,92356,41.0%,$-12660524,$-137,128222,56.9%,$62270140,$486,4818,2.1%,4765,2.1%
+$150001 to $200000,42792,1.6%,$5236,$5998,42792,100.0%,$5236,$5998,$762,$32593342,879,2.1%,$-318522,$-362,41913,97.9%,$32911862,$785,0,0.0%,0,0.0%
+$200001 to $300000,55391,2.0%,$9952,$10461,55391,100.0%,$9952,$10461,$509,$28205350,3638,6.6%,$-353202,$-97,51753,93.4%,$28558554,$552,0,0.0%,0,0.0%
+$300001 to $500000,32748,1.2%,$16226,$15952,32748,100.0%,$16226,$15952,$-273,$-8944396,23765,72.6%,$-13389474,$-563,8983,27.4%,$4445078,$495,0,0.0%,0,0.0%
+$500001 to $1000000,11418,0.4%,$31912,$29991,11417,100.0%,$31913,$29992,$-1921,$-21936012,11383,99.7%,$-22036886,$-1936,35,0.3%,$100874,$2922,0,0.0%,0,0.0%
+Over $1000000,6993,0.3%,$171527,$156431,6993,100.0%,$171530,$156433,$-15096,$-105563360,6959,99.5%,$-111170816,$-15974,33,0.5%,$5607453,$167720,0,0.0%,0,0.0%
+Total,2705850,100.0%,$1488,$1454,970603,35.9%,$4147,$4051,$-96,$-92710912,495476,18.3%,$-259164880,$-523,475127,17.6%,$166452032,$350,1735247,64.1%,1730213,63.9%
diff --git a/us/states/sc/sc_h4216_test_analysis.ipynb b/us/states/sc/sc_h4216_test_analysis.ipynb
index 95e1d55..65013a1 100644
--- a/us/states/sc/sc_h4216_test_analysis.ipynb
+++ b/us/states/sc/sc_h4216_test_analysis.ipynb
@@ -16,7 +16,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "id": "cell-1",
    "metadata": {},
    "outputs": [],
@@ -33,10 +33,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "id": "cell-2",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loading simulations...\n",
+      "Done!\n"
+     ]
+    }
+   ],
    "source": [
     "def create_h4216_reform(top_rate=0.0539):\n",
     "    \"\"\"\n",
@@ -66,10 +75,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "id": "cell-3",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Total tax units: 42,461\n",
+      "Weighted tax units: 2,705,850\n"
+     ]
+    }
+   ],
    "source": [
     "# Get data - use .values to avoid double-weighting\n",
     "baseline_tax = baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
@@ -85,10 +103,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "id": "cell-4",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Bracket analysis complete!\n"
+     ]
+    }
+   ],
    "source": [
     "# Define income brackets matching RFA exactly\n",
     "income_brackets = [\n",
@@ -200,10 +226,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "id": "cell-5",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Totals calculated!\n"
+     ]
+    }
+   ],
    "source": [
     "# Calculate totals\n",
     "change_mask_all = np.abs(tax_change) > 1\n",
@@ -264,10 +298,28 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "id": "cell-6",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "====================================================================================================\n",
+      "H.4216 - POLICYENGINE ANALYSIS (Test Dataset, 5.39% Top Rate)\n",
+      "====================================================================================================\n",
+      "\n",
+      "Total Returns: 2,705,849\n",
+      "General Fund Impact: $-92,710,912\n",
+      "\n",
+      "RFA Estimate: -$119,100,000\n",
+      "Difference: $26,389,088\n",
+      "Accuracy: 77.8%\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
    "source": [
     "# Display summary\n",
     "print(\"=\"*100)\n",
@@ -283,10 +335,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "id": "cell-7",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Exported to: pe_h4216_test_analysis.csv\n"
+     ]
+    }
+   ],
    "source": [
     "# Export to CSV in RFA format\n",
     "df_results.to_csv('pe_h4216_test_analysis.csv', index=False)\n",
@@ -295,10 +355,35 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 8,
    "id": "cell-8",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "KEY METRICS:\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability Total Dollar Change\n",
+      "                $0*         727881         26.9%                    $0                    $0                  $0\n",
+      "       $1 to $10000         498186         18.4%                    $0                    $0                  $0\n",
+      "   $10001 to $20000         233000          8.6%                    $0                    $4             $847688\n",
+      "   $20001 to $30000         171515          6.3%                   $40                   $56            $2756262\n",
+      "   $30001 to $40000         157010          5.8%                  $149                  $135           $-2140517\n",
+      "   $40001 to $50000         132402          4.9%                  $399                  $302          $-12807614\n",
+      "   $50001 to $75000         245406          9.1%                  $701                  $584          $-28577564\n",
+      "  $75001 to $100000         165713          6.1%                 $1452                 $1290          $-26753744\n",
+      " $100001 to $150000         225396          8.3%                 $2929                 $3149           $49609656\n",
+      " $150001 to $200000          42792          1.6%                 $5236                 $5998           $32593342\n",
+      " $200001 to $300000          55391          2.0%                 $9952                $10461           $28205350\n",
+      " $300001 to $500000          32748          1.2%                $16226                $15952           $-8944396\n",
+      "$500001 to $1000000          11418          0.4%                $31912                $29991          $-21936012\n",
+      "      Over $1000000           6993          0.3%               $171527               $156431         $-105563360\n",
+      "              Total        2705850        100.0%                 $1488                 $1454          $-92710912\n"
+     ]
+    }
+   ],
    "source": [
     "# Display key columns for quick comparison\n",
     "display_cols = [\n",
@@ -319,10 +404,38 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 9,
    "id": "cell-10",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "====================================================================================================\n",
+      "POLICYENGINE vs RFA COMPARISON\n",
+      "====================================================================================================\n",
+      "          AGI Range PE Returns RFA Returns     PE Impact    RFA Impact         Diff\n",
+      "                $0*    727,881      78,854            $0     $-571,000    $+571,000\n",
+      "       $1 to $10000    498,186     286,253            $0    $1,655,000  $-1,655,000\n",
+      "   $10001 to $20000    233,000     310,122      $847,688    $2,872,000  $-2,024,312\n",
+      "   $20001 to $30000    171,515     275,560    $2,756,262      $769,000  $+1,987,262\n",
+      "   $30001 to $40000    157,010     269,566   $-2,140,517  $-19,360,000 $+17,219,483\n",
+      "   $40001 to $50000    132,402     234,386  $-12,807,614  $-41,986,000 $+29,178,386\n",
+      "   $50001 to $75000    245,406     407,593  $-28,577,564  $-82,146,000 $+53,568,436\n",
+      "  $75001 to $100000    165,713     250,437  $-26,753,744  $-36,461,000  $+9,707,256\n",
+      " $100001 to $150000    225,396     298,343   $49,609,656    $3,115,000 $+46,494,656\n",
+      " $150001 to $200000     42,792     143,398   $32,593,342   $50,933,000 $-18,339,658\n",
+      " $200001 to $300000     55,391     109,340   $28,205,350   $36,718,000  $-8,512,650\n",
+      " $300001 to $500000     32,748      56,123   $-8,944,396   $-4,627,000  $-4,317,396\n",
+      "$500001 to $1000000     11,418      25,664  $-21,936,012  $-16,195,000  $-5,741,012\n",
+      "      Over $1000000      6,993      11,936 $-105,563,360  $-13,767,000 $-91,796,360\n",
+      "              Total  2,705,850   2,757,573  $-92,710,912 $-119,100,000 $+26,389,088\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
    "source": [
     "# Load RFA data\n",
     "rfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n",
@@ -372,10 +485,37 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 10,
    "id": "cell-11",
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "========================================================================================================================\n",
+      "FULL POLICYENGINE ANALYSIS (RFA Format)\n",
+      "========================================================================================================================\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability  Returns with Tax Change % Returns in Range with Change Old Avg Tax (Changed) New Avg Tax (Changed) Avg Tax Change Total Dollar Change  Tax Decrease # Returns Tax Decrease % in Range Total Decrease Amount Avg Decrease Amount  Tax Increase # Returns Tax Increase % in Range Total Increase Amount Avg Increase Amount  No Tax Change # Returns No Change % Returns  Zero Tax # Returns Zero Tax % Returns\n",
+      "                $0*         727881         26.9%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   727881              100.0%              727881             100.0%\n",
+      "       $1 to $10000         498186         18.4%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   498186              100.0%              498186             100.0%\n",
+      "   $10001 to $20000         233000          8.6%                    $0                    $4                    16527                           7.1%                    $0                   $51            $51             $847688                       0                    0.0%                    $0                  $0                   16527                    7.1%               $847510                 $51                   216473               92.9%              215471              92.5%\n",
+      "   $20001 to $30000         171515          6.3%                   $40                   $56                    48979                          28.6%                  $131                  $187            $56            $2756262                    2691                    1.6%               $-22726                 $-8                   46288                   27.0%              $2778858                 $60                   122536               71.4%              121168              70.6%\n",
+      "   $30001 to $40000         157010          5.8%                  $149                  $135                    70118                          44.7%                  $333                  $302           $-31           $-2140517                   45821                   29.2%             $-3836658                $-84                   24298                   15.5%              $1696106                 $70                    86892               55.3%               86762              55.3%\n",
+      "   $40001 to $50000         132402          4.9%                  $399                  $302                    95777                          72.3%                  $548                  $414          $-134          $-12807614                   49802                   37.6%            $-16610524               $-334                   45975                   34.7%              $3801858                 $83                    36624               27.7%               35193              26.6%\n",
+      "   $50001 to $75000         245406          9.1%                  $701                  $584                   205399                          83.7%                  $836                  $697          $-139          $-28577564                  139789                   57.0%            $-38644192               $-276                   65610                   26.7%             $10066116                $153                    40008               16.3%               39028              15.9%\n",
+      "  $75001 to $100000         165713          6.1%                 $1452                 $1290                   163884                          98.9%                 $1468                 $1305          $-163          $-26753744                  118394                   71.4%            $-40121352               $-339                   45491                   27.5%             $13367631                $294                     1829                1.1%                1759               1.1%\n",
+      " $100001 to $150000         225396          8.3%                 $2929                 $3149                   220578                          97.9%                 $2991                 $3216           $225           $49609656                   92356                   41.0%            $-12660524               $-137                  128222                   56.9%             $62270140                $486                     4818                2.1%                4765               2.1%\n",
+      " $150001 to $200000          42792          1.6%                 $5236                 $5998                    42792                         100.0%                 $5236                 $5998           $762           $32593342                     879                    2.1%              $-318522               $-362                   41913                   97.9%             $32911862                $785                        0                0.0%                   0               0.0%\n",
+      " $200001 to $300000          55391          2.0%                 $9952                $10461                    55391                         100.0%                 $9952                $10461           $509           $28205350                    3638                    6.6%              $-353202                $-97                   51753                   93.4%             $28558554                $552                        0                0.0%                   0               0.0%\n",
+      " $300001 to $500000          32748          1.2%                $16226                $15952                    32748                         100.0%                $16226                $15952          $-273           $-8944396                   23765                   72.6%            $-13389474               $-563                    8983                   27.4%              $4445078                $495                        0                0.0%                   0               0.0%\n",
+      "$500001 to $1000000          11418          0.4%                $31912                $29991                    11417                         100.0%                $31913                $29992         $-1921          $-21936012                   11383                   99.7%            $-22036886              $-1936                      35                    0.3%               $100874               $2922                        0                0.0%                   0               0.0%\n",
+      "      Over $1000000           6993          0.3%               $171527               $156431                     6993                         100.0%               $171530               $156433        $-15096         $-105563360                    6959                   99.5%           $-111170816             $-15974                      33                    0.5%              $5607453             $167720                        0                0.0%                   0               0.0%\n",
+      "              Total        2705850        100.0%                 $1488                 $1454                   970603                          35.9%                 $4147                 $4051           $-96          $-92710912                  495476                   18.3%           $-259164880               $-523                  475127                   17.6%            $166452032                $350                  1735247               64.1%             1730213              63.9%\n"
+     ]
+    }
+   ],
    "source": [
     "# Full results table\n",
     "print(\"\\n\" + \"=\"*120)\n",
@@ -394,8 +534,16 @@
    "name": "python3"
   },
   "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
    "name": "python",
-   "version": "3.11.0"
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
   }
  },
  "nbformat": 4,
diff --git a/us/states/sc/sc_test_dataset_summary_weighted.csv b/us/states/sc/sc_test_dataset_summary_weighted.csv
new file mode 100644
index 0000000..e5cc13e
--- /dev/null
+++ b/us/states/sc/sc_test_dataset_summary_weighted.csv
@@ -0,0 +1,22 @@
+Metric,Value
+Household count (weighted),"1,844,111"
+Person count (weighted),"5,389,226"
+Average household size,2.9
+Weighted median household AGI,"$34,927"
+Weighted average household AGI,"$74,061"
+Weighted median person AGI,"$34,911"
+Weighted average person AGI,"$78,962"
+Unweighted median household AGI,"$57,308"
+Unweighted median person AGI,"$58,750"
+25th percentile household AGI,"$2,489"
+75th percentile household AGI,"$86,301"
+90th percentile household AGI,"$140,239"
+95th percentile household AGI,"$236,759"
+Max household AGI,"$418,650,960"
+Total households with children,"663,513"
+Households with 1 child,"303,647"
+Households with 2 children,"209,804"
+Households with 3+ children,"150,062"
+Total children under 18,"1,247,050"
+Children under 6,"361,890"
+Children under 3,"177,869"

From 2324ff3bd6f9443116aa440f774865b3a4c23fa7 Mon Sep 17 00:00:00 2001
From: David Trimmer <david@policyengine.org>
Date: Fri, 6 Mar 2026 13:13:36 -0500
Subject: [PATCH 12/12] Reorganize SC H.4216 analysis with comprehensive RFA
 comparison

- Restructure into h4216_analysis/ folder with rate-specific subfolders
- Add analysis notebooks for both State and Test datasets at each rate
- Add comprehensive comparison markdown with bracket-by-bracket analysis
- Remove unused intermediate scripts and notebooks

Key findings:
- 5.21% rate: State -$393M, Test -$212M vs RFA -$309M
- 5.39% rate: State -$198M, Test -$93M vs RFA -$119M
- Primary driver: millionaire distribution (State has 90% more, Test has 41% fewer)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../5.21_rate/rfa_h4216_5.21_analysis.csv     |  16 +
 .../state/pe_h4216_5.21_state_analysis.csv    |  16 +
 .../state/sc_h4216_5.21_state_analysis.ipynb  | 550 ++++++++++++
 .../5.21_rate/test/pe_h4216_5.21_analysis.csv |  16 +
 .../test/sc_h4216_5.21_analysis.ipynb         | 555 ++++++++++++
 .../5.39_rate}/rfa_h4216_analysis.csv         |   0
 .../state/pe_h4216_5.39_state_analysis.csv    |  16 +
 .../state/sc_h4216_5.39_state_analysis.ipynb  | 550 ++++++++++++
 .../test}/pe_h4216_test_analysis.csv          |   0
 .../test}/sc_h4216_test_analysis.ipynb        |  81 +-
 .../h4216_analysis_comparison.md              | 286 ++++++
 us/states/sc/h4216_analysis_comparison.md     | 174 ----
 us/states/sc/sc_h4216_budget_impact.py        |  68 --
 us/states/sc/sc_h4216_dataset_comparison.py   |  92 --
 us/states/sc/sc_h4216_reform_analysis.ipynb   | 831 ------------------
 us/states/sc/sc_h4216_tax_impact_analysis.csv |  16 -
 16 files changed, 2009 insertions(+), 1258 deletions(-)
 create mode 100644 us/states/sc/h4216_analysis/5.21_rate/rfa_h4216_5.21_analysis.csv
 create mode 100644 us/states/sc/h4216_analysis/5.21_rate/state/pe_h4216_5.21_state_analysis.csv
 create mode 100644 us/states/sc/h4216_analysis/5.21_rate/state/sc_h4216_5.21_state_analysis.ipynb
 create mode 100644 us/states/sc/h4216_analysis/5.21_rate/test/pe_h4216_5.21_analysis.csv
 create mode 100644 us/states/sc/h4216_analysis/5.21_rate/test/sc_h4216_5.21_analysis.ipynb
 rename us/states/sc/{ => h4216_analysis/5.39_rate}/rfa_h4216_analysis.csv (100%)
 create mode 100644 us/states/sc/h4216_analysis/5.39_rate/state/pe_h4216_5.39_state_analysis.csv
 create mode 100644 us/states/sc/h4216_analysis/5.39_rate/state/sc_h4216_5.39_state_analysis.ipynb
 rename us/states/sc/{ => h4216_analysis/5.39_rate/test}/pe_h4216_test_analysis.csv (100%)
 rename us/states/sc/{ => h4216_analysis/5.39_rate/test}/sc_h4216_test_analysis.ipynb (87%)
 create mode 100644 us/states/sc/h4216_analysis/h4216_analysis_comparison.md
 delete mode 100644 us/states/sc/h4216_analysis_comparison.md
 delete mode 100644 us/states/sc/sc_h4216_budget_impact.py
 delete mode 100644 us/states/sc/sc_h4216_dataset_comparison.py
 delete mode 100644 us/states/sc/sc_h4216_reform_analysis.ipynb
 delete mode 100644 us/states/sc/sc_h4216_tax_impact_analysis.csv

diff --git a/us/states/sc/h4216_analysis/5.21_rate/rfa_h4216_5.21_analysis.csv b/us/states/sc/h4216_analysis/5.21_rate/rfa_h4216_5.21_analysis.csv
new file mode 100644
index 0000000..a150bea
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.21_rate/rfa_h4216_5.21_analysis.csv
@@ -0,0 +1,16 @@
+Federal AGI Range,Est # Returns,Est % Returns,Old Avg Tax Liability,New Avg Tax Liability,Returns with Tax Change,% Returns in Range with Change,Old Avg Tax (Changed),New Avg Tax (Changed),Avg Tax Change,Total Dollar Change,Tax Decrease # Returns,Tax Decrease % in Range,Total Decrease Amount,Avg Decrease Amount,Tax Increase # Returns,Tax Increase % in Range,Total Increase Amount,Avg Increase Amount,No Tax Change # Returns,No Change % Returns,Zero Tax # Returns,Zero Tax % Returns
+$0*,78854,2.9%,$50,$42,1080,1.4%,$3683,$3062,$-622,$-671000,576,0.7%,$-704000,$-1222,504,0.6%,$34000,$68,77774,98.6%,77824,98.7%
+$1 to $10000,286253,10.4%,$3,$9,43699,15.3%,$20,$58,$38,$1653000,834,0.3%,$-78000,$-94,42865,15.0%,$1731000,$40,242554,84.7%,243249,85.0%
+$10001 to $20000,310122,11.2%,$16,$26,75652,24.4%,$67,$105,$38,$2867000,5591,1.8%,$-363000,$-65,70060,22.6%,$3230000,$46,234471,75.6%,235107,75.8%
+$20001 to $30000,275560,10.0%,$107,$110,140713,51.1%,$210,$216,$5,$762000,51551,18.7%,$-2682000,$-52,89162,32.4%,$3444000,$39,134847,48.9%,134332,48.7%
+$30001 to $40000,269566,9.8%,$288,$216,160474,59.5%,$483,$362,$-121,$-19416000,131752,48.9%,$-21120000,$-160,28722,10.7%,$1704000,$59,109091,40.5%,110638,41.0%
+$40001 to $50000,234386,8.5%,$569,$388,174125,74.3%,$767,$522,$-244,$-42568000,127554,54.4%,$-46871000,$-367,46572,19.9%,$4303000,$92,60260,25.7%,61891,26.4%
+$50001 to $75000,407593,14.8%,$1192,$971,351754,86.3%,$1381,$1125,$-256,$-89935000,287674,70.6%,$-101116000,$-351,64080,15.7%,$11181000,$174,55839,13.7%,61960,15.2%
+$75001 to $100000,250437,9.1%,$2020,$1826,225194,89.9%,$2246,$2030,$-216,$-48624000,177430,70.8%,$-61900000,$-349,47764,19.1%,$13276000,$278,25243,10.1%,27729,11.1%
+$100001 to $150000,298343,10.8%,$3258,$3171,289948,97.2%,$3352,$3262,$-90,$-26092000,199040,66.7%,$-58517000,$-294,90908,30.5%,$32425000,$357,8395,2.8%,9188,3.1%
+$150001 to $200000,143398,5.2%,$5518,$5684,141433,98.6%,$5595,$5763,$168,$23766000,61936,43.2%,$-14937000,$-241,79497,55.4%,$38703000,$487,1965,1.4%,1459,1.0%
+$200001 to $300000,109340,4.0%,$8741,$8777,108016,98.8%,$8848,$8885,$37,$3955000,63636,58.2%,$-27603000,$-434,44380,40.6%,$31558000,$711,1324,1.2%,945,0.9%
+$300001 to $500000,56123,2.0%,$14926,$14355,55090,98.2%,$15206,$14624,$-582,$-32054000,42933,76.5%,$-47609000,$-1109,12157,21.7%,$15555000,$1280,1032,1.8%,762,1.4%
+$500001 to $1000000,25664,0.9%,$25969,$24512,24758,96.5%,$26919,$25410,$-1510,$-37381000,19803,77.2%,$-51185000,$-2585,4955,19.3%,$13804000,$2786,906,3.5%,684,2.7%
+Over $1000000,11936,0.4%,$78228,$74458,11159,93.5%,$83671,$79639,$-4031,$-44989000,8693,72.8%,$-87454000,$-10060,2466,20.7%,$42465000,$17221,776,6.5%,703,5.9%
+Total,2757573,100.0%,$2321,$2209,1803095,65.4%,$3549,$3378,$-171,$-308700000,1179002,42.8%,$-522100000,$-443,624092,22.6%,$213400000,$342,954478,34.6%,966471,35.0%
diff --git a/us/states/sc/h4216_analysis/5.21_rate/state/pe_h4216_5.21_state_analysis.csv b/us/states/sc/h4216_analysis/5.21_rate/state/pe_h4216_5.21_state_analysis.csv
new file mode 100644
index 0000000..5d7b774
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.21_rate/state/pe_h4216_5.21_state_analysis.csv
@@ -0,0 +1,16 @@
+Federal AGI Range,Est # Returns,Est % Returns,Old Avg Tax Liability,New Avg Tax Liability,Returns with Tax Change,% Returns in Range with Change,Old Avg Tax (Changed),New Avg Tax (Changed),Avg Tax Change,Total Dollar Change,Tax Decrease # Returns,Tax Decrease % in Range,Total Decrease Amount,Avg Decrease Amount,Tax Increase # Returns,Tax Increase % in Range,Total Increase Amount,Avg Increase Amount,No Tax Change # Returns,No Change % Returns,Zero Tax # Returns,Zero Tax % Returns
+$0*,619010,21.1%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,619010,100.0%,619010,100.0%
+$1 to $10000,502276,17.1%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,502276,100.0%,502276,100.0%
+$10001 to $20000,279412,9.5%,$0,$10,53961,19.3%,$0,$50,$50,$2672942,0,0.0%,$0,$0,53961,19.3%,$2672922,$50,225451,80.7%,225413,80.7%
+$20001 to $30000,252863,8.6%,$64,$101,136052,53.8%,$119,$188,$68,$9294693,5029,2.0%,$-40734,$-8,131023,51.8%,$9335378,$71,116811,46.2%,116751,46.2%
+$30001 to $40000,215980,7.4%,$225,$200,135926,62.9%,$356,$316,$-40,$-5431497,88710,41.1%,$-8472465,$-96,47216,21.9%,$3040994,$64,80055,37.1%,79265,36.7%
+$40001 to $50000,197525,6.7%,$547,$404,152733,77.3%,$706,$522,$-184,$-28145982,99989,50.6%,$-34226980,$-342,52744,26.7%,$6080948,$115,44792,22.7%,44131,22.3%
+$50001 to $75000,300857,10.2%,$822,$722,254734,84.7%,$971,$853,$-118,$-30064724,164685,54.7%,$-45636192,$-277,90049,29.9%,$15571469,$173,46123,15.3%,46125,15.3%
+$75001 to $100000,177284,6.0%,$1781,$1631,168284,94.9%,$1876,$1718,$-157,$-26475178,128443,72.5%,$-39583444,$-308,39841,22.5%,$13108268,$329,9000,5.1%,9124,5.1%
+$100001 to $150000,187946,6.4%,$3292,$3387,186839,99.4%,$3311,$3407,$96,$17889888,111928,59.6%,$-22415936,$-200,74911,39.9%,$40305824,$538,1107,0.6%,1105,0.6%
+$150001 to $200000,73396,2.5%,$6049,$6413,73395,100.0%,$6049,$6412,$363,$26678432,14400,19.6%,$-3249580,$-226,58996,80.4%,$29928012,$507,1,0.0%,0,0.0%
+$200001 to $300000,52882,1.8%,$9164,$9358,52878,100.0%,$9164,$9358,$194,$10258680,21154,40.0%,$-5374373,$-254,31724,60.0%,$15633049,$493,4,0.0%,0,0.0%
+$300001 to $500000,36977,1.3%,$17163,$16717,36977,100.0%,$17163,$16717,$-447,$-16518335,28313,76.6%,$-27952982,$-987,8664,23.4%,$11434646,$1320,0,0.0%,0,0.0%
+$500001 to $1000000,16526,0.6%,$26140,$24911,16526,100.0%,$26140,$24911,$-1229,$-20314260,14769,89.4%,$-25823908,$-1749,1757,10.6%,$5509648,$3136,0,0.0%,0,0.0%
+Over $1000000,22686,0.8%,$139623,$124950,22686,100.0%,$139623,$124950,$-14672,$-332860608,22658,99.9%,$-333138432,$-14703,29,0.1%,$277836,$9684,0,0.0%,0,0.0%
+Total,2935621,100.0%,$2220,$2086,1290992,44.0%,$5048,$4744,$-304,$-393015936,700078,23.8%,$-545915008,$-780,590915,20.1%,$152898992,$259,1644629,56.0%,1643201,56.0%
diff --git a/us/states/sc/h4216_analysis/5.21_rate/state/sc_h4216_5.21_state_analysis.ipynb b/us/states/sc/h4216_analysis/5.21_rate/state/sc_h4216_5.21_state_analysis.ipynb
new file mode 100644
index 0000000..b58e742
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.21_rate/state/sc_h4216_5.21_state_analysis.ipynb
@@ -0,0 +1,550 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "cell-0",
+   "metadata": {},
+   "source": [
+    "# SC H.4216 Tax Reform Analysis - 5.21% Top Rate (State Dataset)\n",
+    "\n",
+    "This notebook produces analysis in the same format as the RFA fiscal note for direct comparison.\n",
+    "\n",
+    "**Dataset:** `hf://policyengine/policyengine-us-data/states/SC.h5` (Production)\n",
+    "\n",
+    "**Reform:** H.4216 with 5.21% top rate (bill default)\n",
+    "\n",
+    "**RFA Estimate:** -$308,700,000"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "cell-1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\n",
+    "from policyengine_core.reforms import Reform\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/policyengine-us-data/states/SC.h5\"\n",
+    "TAX_YEAR = 2026\n",
+    "TOP_RATE = 0.0521  # 5.21% top rate\n",
+    "RFA_ESTIMATE = -308700000"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "cell-2",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loading simulations...\n",
+      "Done!\n"
+     ]
+    }
+   ],
+   "source": [
+    "def create_h4216_reform(top_rate=0.0521):\n",
+    "    \"\"\"\n",
+    "    SC H.4216 Reform:\n",
+    "    - 1.99% up to $30k\n",
+    "    - top_rate over $30k (default 5.21% for bill version)\n",
+    "    \"\"\"\n",
+    "    param_reform = Reform.from_dict(\n",
+    "        {\n",
+    "            \"gov.contrib.states.sc.h4216.in_effect\": {\n",
+    "                \"2026-01-01.2100-12-31\": True\n",
+    "            },\n",
+    "            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n",
+    "                \"2026-01-01.2100-12-31\": top_rate\n",
+    "            }\n",
+    "        },\n",
+    "        country_id=\"us\",\n",
+    "    )\n",
+    "    base_reform = create_sc_h4216()\n",
+    "    return (base_reform, param_reform)\n",
+    "\n",
+    "print(\"Loading simulations...\")\n",
+    "baseline = Microsimulation(dataset=SC_DATASET)\n",
+    "reform_sim = Microsimulation(dataset=SC_DATASET, reform=create_h4216_reform(TOP_RATE))\n",
+    "print(\"Done!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "cell-3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Total tax units: 49,486\n",
+      "Weighted tax units: 2,935,621\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Get data - use .values to avoid double-weighting\n",
+    "baseline_tax = baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "reform_tax = reform_sim.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "agi = baseline.calculate(\"adjusted_gross_income\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "weight = baseline.calculate(\"tax_unit_weight\", period=TAX_YEAR).values\n",
+    "\n",
+    "tax_change = reform_tax - baseline_tax\n",
+    "\n",
+    "print(f\"Total tax units: {len(baseline_tax):,}\")\n",
+    "print(f\"Weighted tax units: {weight.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "cell-4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Bracket analysis complete!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Define income brackets matching RFA exactly\n",
+    "income_brackets = [\n",
+    "    (float('-inf'), 0, \"$0*\"),\n",
+    "    (0, 10000, \"$1 to $10000\"),\n",
+    "    (10000, 20000, \"$10001 to $20000\"),\n",
+    "    (20000, 30000, \"$20001 to $30000\"),\n",
+    "    (30000, 40000, \"$30001 to $40000\"),\n",
+    "    (40000, 50000, \"$40001 to $50000\"),\n",
+    "    (50000, 75000, \"$50001 to $75000\"),\n",
+    "    (75000, 100000, \"$75001 to $100000\"),\n",
+    "    (100000, 150000, \"$100001 to $150000\"),\n",
+    "    (150000, 200000, \"$150001 to $200000\"),\n",
+    "    (200000, 300000, \"$200001 to $300000\"),\n",
+    "    (300000, 500000, \"$300001 to $500000\"),\n",
+    "    (500000, 1000000, \"$500001 to $1000000\"),\n",
+    "    (1000000, float('inf'), \"Over $1000000\")\n",
+    "]\n",
+    "\n",
+    "total_weight = weight.sum()\n",
+    "results = []\n",
+    "\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    if lower == float('-inf'):\n",
+    "        mask = agi <= upper\n",
+    "    elif upper == float('inf'):\n",
+    "        mask = agi > lower\n",
+    "    else:\n",
+    "        mask = (agi > lower) & (agi <= upper)\n",
+    "    \n",
+    "    if mask.sum() == 0:\n",
+    "        continue\n",
+    "    \n",
+    "    # Basic stats\n",
+    "    est_returns = weight[mask].sum()\n",
+    "    pct_returns = est_returns / total_weight * 100\n",
+    "    \n",
+    "    old_avg_tax = np.average(baseline_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    new_avg_tax = np.average(reform_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Returns with tax change (threshold $1)\n",
+    "    change_mask = mask & (np.abs(tax_change) > 1)\n",
+    "    returns_with_change = weight[change_mask].sum()\n",
+    "    pct_with_change = returns_with_change / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    if returns_with_change > 0:\n",
+    "        old_avg_changed = np.average(baseline_tax[change_mask], weights=weight[change_mask])\n",
+    "        new_avg_changed = np.average(reform_tax[change_mask], weights=weight[change_mask])\n",
+    "        avg_change = np.average(tax_change[change_mask], weights=weight[change_mask])\n",
+    "    else:\n",
+    "        old_avg_changed = 0\n",
+    "        new_avg_changed = 0\n",
+    "        avg_change = 0\n",
+    "    \n",
+    "    total_change = (tax_change[mask] * weight[mask]).sum()\n",
+    "    \n",
+    "    # Tax decrease\n",
+    "    decrease_mask = mask & (tax_change < -1)\n",
+    "    decrease_returns = weight[decrease_mask].sum()\n",
+    "    decrease_pct = decrease_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_decrease = (tax_change[decrease_mask] * weight[decrease_mask]).sum() if decrease_returns > 0 else 0\n",
+    "    avg_decrease = np.average(tax_change[decrease_mask], weights=weight[decrease_mask]) if decrease_returns > 0 else 0\n",
+    "    \n",
+    "    # Tax increase\n",
+    "    increase_mask = mask & (tax_change > 1)\n",
+    "    increase_returns = weight[increase_mask].sum()\n",
+    "    increase_pct = increase_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_increase = (tax_change[increase_mask] * weight[increase_mask]).sum() if increase_returns > 0 else 0\n",
+    "    avg_increase = np.average(tax_change[increase_mask], weights=weight[increase_mask]) if increase_returns > 0 else 0\n",
+    "    \n",
+    "    # No change\n",
+    "    no_change_mask = mask & (np.abs(tax_change) <= 1)\n",
+    "    no_change_returns = weight[no_change_mask].sum()\n",
+    "    no_change_pct = no_change_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Zero tax\n",
+    "    zero_tax_mask = mask & (reform_tax <= 0)\n",
+    "    zero_tax_returns = weight[zero_tax_mask].sum()\n",
+    "    zero_tax_pct = zero_tax_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    results.append({\n",
+    "        \"Federal AGI Range\": label,\n",
+    "        \"Est # Returns\": int(round(est_returns)),\n",
+    "        \"Est % Returns\": f\"{pct_returns:.1f}%\",\n",
+    "        \"Old Avg Tax Liability\": f\"${int(round(old_avg_tax))}\",\n",
+    "        \"New Avg Tax Liability\": f\"${int(round(new_avg_tax))}\",\n",
+    "        \"Returns with Tax Change\": int(round(returns_with_change)),\n",
+    "        \"% Returns in Range with Change\": f\"{pct_with_change:.1f}%\",\n",
+    "        \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed))}\",\n",
+    "        \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed))}\",\n",
+    "        \"Avg Tax Change\": f\"${int(round(avg_change))}\",\n",
+    "        \"Total Dollar Change\": f\"${int(round(total_change))}\",\n",
+    "        \"Tax Decrease # Returns\": int(round(decrease_returns)),\n",
+    "        \"Tax Decrease % in Range\": f\"{decrease_pct:.1f}%\",\n",
+    "        \"Total Decrease Amount\": f\"${int(round(total_decrease))}\",\n",
+    "        \"Avg Decrease Amount\": f\"${int(round(avg_decrease))}\",\n",
+    "        \"Tax Increase # Returns\": int(round(increase_returns)),\n",
+    "        \"Tax Increase % in Range\": f\"{increase_pct:.1f}%\",\n",
+    "        \"Total Increase Amount\": f\"${int(round(total_increase))}\",\n",
+    "        \"Avg Increase Amount\": f\"${int(round(avg_increase))}\",\n",
+    "        \"No Tax Change # Returns\": int(round(no_change_returns)),\n",
+    "        \"No Change % Returns\": f\"{no_change_pct:.1f}%\",\n",
+    "        \"Zero Tax # Returns\": int(round(zero_tax_returns)),\n",
+    "        \"Zero Tax % Returns\": f\"{zero_tax_pct:.1f}%\"\n",
+    "    })\n",
+    "\n",
+    "print(\"Bracket analysis complete!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "cell-5",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Totals calculated!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Calculate totals\n",
+    "change_mask_all = np.abs(tax_change) > 1\n",
+    "decrease_mask_all = tax_change < -1\n",
+    "increase_mask_all = tax_change > 1\n",
+    "no_change_mask_all = np.abs(tax_change) <= 1\n",
+    "zero_tax_mask_all = reform_tax <= 0\n",
+    "\n",
+    "total_old_avg = np.average(baseline_tax, weights=weight)\n",
+    "total_new_avg = np.average(reform_tax, weights=weight)\n",
+    "total_change_amount = (tax_change * weight).sum()\n",
+    "\n",
+    "returns_with_change_all = weight[change_mask_all].sum()\n",
+    "old_avg_changed_all = np.average(baseline_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "new_avg_changed_all = np.average(reform_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "avg_change_all = np.average(tax_change[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "\n",
+    "decrease_returns_all = weight[decrease_mask_all].sum()\n",
+    "total_decrease_all = (tax_change[decrease_mask_all] * weight[decrease_mask_all]).sum()\n",
+    "avg_decrease_all = np.average(tax_change[decrease_mask_all], weights=weight[decrease_mask_all]) if decrease_returns_all > 0 else 0\n",
+    "\n",
+    "increase_returns_all = weight[increase_mask_all].sum()\n",
+    "total_increase_all = (tax_change[increase_mask_all] * weight[increase_mask_all]).sum()\n",
+    "avg_increase_all = np.average(tax_change[increase_mask_all], weights=weight[increase_mask_all]) if increase_returns_all > 0 else 0\n",
+    "\n",
+    "no_change_returns_all = weight[no_change_mask_all].sum()\n",
+    "zero_tax_returns_all = weight[zero_tax_mask_all].sum()\n",
+    "\n",
+    "results.append({\n",
+    "    \"Federal AGI Range\": \"Total\",\n",
+    "    \"Est # Returns\": int(round(total_weight)),\n",
+    "    \"Est % Returns\": \"100.0%\",\n",
+    "    \"Old Avg Tax Liability\": f\"${int(round(total_old_avg))}\",\n",
+    "    \"New Avg Tax Liability\": f\"${int(round(total_new_avg))}\",\n",
+    "    \"Returns with Tax Change\": int(round(returns_with_change_all)),\n",
+    "    \"% Returns in Range with Change\": f\"{returns_with_change_all / total_weight * 100:.1f}%\",\n",
+    "    \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed_all))}\",\n",
+    "    \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed_all))}\",\n",
+    "    \"Avg Tax Change\": f\"${int(round(avg_change_all))}\",\n",
+    "    \"Total Dollar Change\": f\"${int(round(total_change_amount))}\",\n",
+    "    \"Tax Decrease # Returns\": int(round(decrease_returns_all)),\n",
+    "    \"Tax Decrease % in Range\": f\"{decrease_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Decrease Amount\": f\"${int(round(total_decrease_all))}\",\n",
+    "    \"Avg Decrease Amount\": f\"${int(round(avg_decrease_all))}\",\n",
+    "    \"Tax Increase # Returns\": int(round(increase_returns_all)),\n",
+    "    \"Tax Increase % in Range\": f\"{increase_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Increase Amount\": f\"${int(round(total_increase_all))}\",\n",
+    "    \"Avg Increase Amount\": f\"${int(round(avg_increase_all))}\",\n",
+    "    \"No Tax Change # Returns\": int(round(no_change_returns_all)),\n",
+    "    \"No Change % Returns\": f\"{no_change_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Zero Tax # Returns\": int(round(zero_tax_returns_all)),\n",
+    "    \"Zero Tax % Returns\": f\"{zero_tax_returns_all / total_weight * 100:.1f}%\"\n",
+    "})\n",
+    "\n",
+    "df_results = pd.DataFrame(results)\n",
+    "print(\"Totals calculated!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "cell-6",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "====================================================================================================\n",
+      "H.4216 - POLICYENGINE ANALYSIS (State Dataset, 5.21% Top Rate)\n",
+      "====================================================================================================\n",
+      "\n",
+      "Total Returns: 2,935,621\n",
+      "General Fund Impact: $-393,015,936\n",
+      "\n",
+      "RFA Estimate: $-308,700,000\n",
+      "Difference: $-84,315,936\n",
+      "Accuracy: 72.7%\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display summary\n",
+    "print(\"=\"*100)\n",
+    "print(f\"H.4216 - POLICYENGINE ANALYSIS (State Dataset, {TOP_RATE*100:.2f}% Top Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(f\"\\nTotal Returns: {int(total_weight):,}\")\n",
+    "print(f\"General Fund Impact: ${total_change_amount:,.0f}\")\n",
+    "print(f\"\\nRFA Estimate: ${RFA_ESTIMATE:,}\")\n",
+    "print(f\"Difference: ${total_change_amount - RFA_ESTIMATE:,.0f}\")\n",
+    "print(f\"Accuracy: {(1 - abs(total_change_amount - RFA_ESTIMATE) / abs(RFA_ESTIMATE)) * 100:.1f}%\")\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "cell-7",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Exported to: pe_h4216_5.21_state_analysis.csv\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Export to CSV in RFA format\n",
+    "df_results.to_csv('pe_h4216_5.21_state_analysis.csv', index=False)\n",
+    "print(\"Exported to: pe_h4216_5.21_state_analysis.csv\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "cell-8",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "KEY METRICS:\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability Total Dollar Change\n",
+      "                $0*         619010         21.1%                    $0                    $0                  $0\n",
+      "       $1 to $10000         502276         17.1%                    $0                    $0                  $0\n",
+      "   $10001 to $20000         279412          9.5%                    $0                   $10            $2672942\n",
+      "   $20001 to $30000         252863          8.6%                   $64                  $101            $9294693\n",
+      "   $30001 to $40000         215980          7.4%                  $225                  $200           $-5431497\n",
+      "   $40001 to $50000         197525          6.7%                  $547                  $404          $-28145982\n",
+      "   $50001 to $75000         300857         10.2%                  $822                  $722          $-30064724\n",
+      "  $75001 to $100000         177284          6.0%                 $1781                 $1631          $-26475178\n",
+      " $100001 to $150000         187946          6.4%                 $3292                 $3387           $17889888\n",
+      " $150001 to $200000          73396          2.5%                 $6049                 $6413           $26678432\n",
+      " $200001 to $300000          52882          1.8%                 $9164                 $9358           $10258680\n",
+      " $300001 to $500000          36977          1.3%                $17163                $16717          $-16518335\n",
+      "$500001 to $1000000          16526          0.6%                $26140                $24911          $-20314260\n",
+      "      Over $1000000          22686          0.8%               $139623               $124950         $-332860608\n",
+      "              Total        2935621        100.0%                 $2220                 $2086         $-393015936\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display key columns for quick comparison\n",
+    "display_cols = [\n",
+    "    \"Federal AGI Range\", \"Est # Returns\", \"Est % Returns\",\n",
+    "    \"Old Avg Tax Liability\", \"New Avg Tax Liability\", \"Total Dollar Change\"\n",
+    "]\n",
+    "print(\"\\nKEY METRICS:\")\n",
+    "print(df_results[display_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "cell-9",
+   "metadata": {},
+   "source": [
+    "## Side-by-Side Comparison with RFA"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "cell-10",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "====================================================================================================\n",
+      "POLICYENGINE (State) vs RFA COMPARISON (5.21% Rate)\n",
+      "====================================================================================================\n",
+      "          AGI Range PE Returns RFA Returns     PE Impact    RFA Impact          Diff\n",
+      "                $0*    619,010      78,854            $0     $-671,000     $+671,000\n",
+      "       $1 to $10000    502,276     286,253            $0    $1,653,000   $-1,653,000\n",
+      "   $10001 to $20000    279,412     310,122    $2,672,942    $2,867,000     $-194,058\n",
+      "   $20001 to $30000    252,863     275,560    $9,294,693      $762,000   $+8,532,693\n",
+      "   $30001 to $40000    215,980     269,566   $-5,431,497  $-19,416,000  $+13,984,503\n",
+      "   $40001 to $50000    197,525     234,386  $-28,145,982  $-42,568,000  $+14,422,018\n",
+      "   $50001 to $75000    300,857     407,593  $-30,064,724  $-89,935,000  $+59,870,276\n",
+      "  $75001 to $100000    177,284     250,437  $-26,475,178  $-48,624,000  $+22,148,822\n",
+      " $100001 to $150000    187,946     298,343   $17,889,888  $-26,092,000  $+43,981,888\n",
+      " $150001 to $200000     73,396     143,398   $26,678,432   $23,766,000   $+2,912,432\n",
+      " $200001 to $300000     52,882     109,340   $10,258,680    $3,955,000   $+6,303,680\n",
+      " $300001 to $500000     36,977      56,123  $-16,518,335  $-32,054,000  $+15,535,665\n",
+      "$500001 to $1000000     16,526      25,664  $-20,314,260  $-37,381,000  $+17,066,740\n",
+      "      Over $1000000     22,686      11,936 $-332,860,608  $-44,989,000 $-287,871,608\n",
+      "              Total  2,935,621   2,757,573 $-393,015,936 $-308,700,000  $-84,315,936\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Load RFA data\n",
+    "rfa_df = pd.read_csv('../rfa_h4216_5.21_analysis.csv')\n",
+    "\n",
+    "def parse_dollar(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('$', '').replace(',', '').replace('%', ''))\n",
+    "    return val\n",
+    "\n",
+    "# Create comparison\n",
+    "comparison = []\n",
+    "for idx, pe_row in df_results.iterrows():\n",
+    "    agi_range = pe_row['Federal AGI Range']\n",
+    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == agi_range]\n",
+    "    \n",
+    "    pe_returns = pe_row['Est # Returns']\n",
+    "    pe_impact = parse_dollar(pe_row['Total Dollar Change'])\n",
+    "    \n",
+    "    if len(rfa_match) > 0:\n",
+    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
+    "        rfa_impact = parse_dollar(rfa_match['Total Dollar Change'].values[0])\n",
+    "    else:\n",
+    "        rfa_returns = 0\n",
+    "        rfa_impact = 0\n",
+    "    \n",
+    "    comparison.append({\n",
+    "        'AGI Range': agi_range,\n",
+    "        'PE Returns': f\"{pe_returns:,}\",\n",
+    "        'RFA Returns': f\"{rfa_returns:,}\" if rfa_returns else \"N/A\",\n",
+    "        'PE Impact': f\"${pe_impact:,.0f}\",\n",
+    "        'RFA Impact': f\"${rfa_impact:,.0f}\" if rfa_impact else \"N/A\",\n",
+    "        'Diff': f\"${pe_impact - rfa_impact:+,.0f}\" if rfa_impact else \"N/A\"\n",
+    "    })\n",
+    "\n",
+    "comparison_df = pd.DataFrame(comparison)\n",
+    "print(\"\\n\" + \"=\"*100)\n",
+    "print(\"POLICYENGINE (State) vs RFA COMPARISON (5.21% Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(comparison_df.to_string(index=False))\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "cell-11",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "========================================================================================================================\n",
+      "FULL POLICYENGINE ANALYSIS (RFA Format)\n",
+      "========================================================================================================================\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability  Returns with Tax Change % Returns in Range with Change Old Avg Tax (Changed) New Avg Tax (Changed) Avg Tax Change Total Dollar Change  Tax Decrease # Returns Tax Decrease % in Range Total Decrease Amount Avg Decrease Amount  Tax Increase # Returns Tax Increase % in Range Total Increase Amount Avg Increase Amount  No Tax Change # Returns No Change % Returns  Zero Tax # Returns Zero Tax % Returns\n",
+      "                $0*         619010         21.1%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   619010              100.0%              619010             100.0%\n",
+      "       $1 to $10000         502276         17.1%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   502276              100.0%              502276             100.0%\n",
+      "   $10001 to $20000         279412          9.5%                    $0                   $10                    53961                          19.3%                    $0                   $50            $50            $2672942                       0                    0.0%                    $0                  $0                   53961                   19.3%              $2672922                 $50                   225451               80.7%              225413              80.7%\n",
+      "   $20001 to $30000         252863          8.6%                   $64                  $101                   136052                          53.8%                  $119                  $188            $68            $9294693                    5029                    2.0%               $-40734                 $-8                  131023                   51.8%              $9335378                 $71                   116811               46.2%              116751              46.2%\n",
+      "   $30001 to $40000         215980          7.4%                  $225                  $200                   135926                          62.9%                  $356                  $316           $-40           $-5431497                   88710                   41.1%             $-8472465                $-96                   47216                   21.9%              $3040994                 $64                    80055               37.1%               79265              36.7%\n",
+      "   $40001 to $50000         197525          6.7%                  $547                  $404                   152733                          77.3%                  $706                  $522          $-184          $-28145982                   99989                   50.6%            $-34226980               $-342                   52744                   26.7%              $6080948                $115                    44792               22.7%               44131              22.3%\n",
+      "   $50001 to $75000         300857         10.2%                  $822                  $722                   254734                          84.7%                  $971                  $853          $-118          $-30064724                  164685                   54.7%            $-45636192               $-277                   90049                   29.9%             $15571469                $173                    46123               15.3%               46125              15.3%\n",
+      "  $75001 to $100000         177284          6.0%                 $1781                 $1631                   168284                          94.9%                 $1876                 $1718          $-157          $-26475178                  128443                   72.5%            $-39583444               $-308                   39841                   22.5%             $13108268                $329                     9000                5.1%                9124               5.1%\n",
+      " $100001 to $150000         187946          6.4%                 $3292                 $3387                   186839                          99.4%                 $3311                 $3407            $96           $17889888                  111928                   59.6%            $-22415936               $-200                   74911                   39.9%             $40305824                $538                     1107                0.6%                1105               0.6%\n",
+      " $150001 to $200000          73396          2.5%                 $6049                 $6413                    73395                         100.0%                 $6049                 $6412           $363           $26678432                   14400                   19.6%             $-3249580               $-226                   58996                   80.4%             $29928012                $507                        1                0.0%                   0               0.0%\n",
+      " $200001 to $300000          52882          1.8%                 $9164                 $9358                    52878                         100.0%                 $9164                 $9358           $194           $10258680                   21154                   40.0%             $-5374373               $-254                   31724                   60.0%             $15633049                $493                        4                0.0%                   0               0.0%\n",
+      " $300001 to $500000          36977          1.3%                $17163                $16717                    36977                         100.0%                $17163                $16717          $-447          $-16518335                   28313                   76.6%            $-27952982               $-987                    8664                   23.4%             $11434646               $1320                        0                0.0%                   0               0.0%\n",
+      "$500001 to $1000000          16526          0.6%                $26140                $24911                    16526                         100.0%                $26140                $24911         $-1229          $-20314260                   14769                   89.4%            $-25823908              $-1749                    1757                   10.6%              $5509648               $3136                        0                0.0%                   0               0.0%\n",
+      "      Over $1000000          22686          0.8%               $139623               $124950                    22686                         100.0%               $139623               $124950        $-14672         $-332860608                   22658                   99.9%           $-333138432             $-14703                      29                    0.1%               $277836               $9684                        0                0.0%                   0               0.0%\n",
+      "              Total        2935621        100.0%                 $2220                 $2086                  1290992                          44.0%                 $5048                 $4744          $-304         $-393015936                  700078                   23.8%           $-545915008               $-780                  590915                   20.1%            $152898992                $259                  1644629               56.0%             1643201              56.0%\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Full results table\n",
+    "print(\"\\n\" + \"=\"*120)\n",
+    "print(\"FULL POLICYENGINE ANALYSIS (RFA Format)\")\n",
+    "print(\"=\"*120)\n",
+    "pd.set_option('display.max_columns', None)\n",
+    "pd.set_option('display.width', None)\n",
+    "print(df_results.to_string(index=False))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/us/states/sc/h4216_analysis/5.21_rate/test/pe_h4216_5.21_analysis.csv b/us/states/sc/h4216_analysis/5.21_rate/test/pe_h4216_5.21_analysis.csv
new file mode 100644
index 0000000..99fdf7e
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.21_rate/test/pe_h4216_5.21_analysis.csv
@@ -0,0 +1,16 @@
+Federal AGI Range,Est # Returns,Est % Returns,Old Avg Tax Liability,New Avg Tax Liability,Returns with Tax Change,% Returns in Range with Change,Old Avg Tax (Changed),New Avg Tax (Changed),Avg Tax Change,Total Dollar Change,Tax Decrease # Returns,Tax Decrease % in Range,Total Decrease Amount,Avg Decrease Amount,Tax Increase # Returns,Tax Increase % in Range,Total Increase Amount,Avg Increase Amount,No Tax Change # Returns,No Change % Returns,Zero Tax # Returns,Zero Tax % Returns
+$0*,727881,26.9%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,727881,100.0%,727881,100.0%
+$1 to $10000,498186,18.4%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,498186,100.0%,498186,100.0%
+$10001 to $20000,233000,8.6%,$0,$4,16527,7.1%,$0,$51,$51,$847688,0,0.0%,$0,$0,16527,7.1%,$847510,$51,216473,92.9%,215471,92.5%
+$20001 to $30000,171515,6.3%,$40,$56,48979,28.6%,$131,$187,$56,$2756262,2691,1.6%,$-22726,$-8,46288,27.0%,$2778858,$60,122536,71.4%,121168,70.6%
+$30001 to $40000,157010,5.8%,$149,$135,70118,44.7%,$333,$302,$-31,$-2140517,45821,29.2%,$-3836658,$-84,24298,15.5%,$1696106,$70,86892,55.3%,86762,55.3%
+$40001 to $50000,132402,4.9%,$399,$301,95777,72.3%,$548,$413,$-135,$-12939930,49802,37.6%,$-16742836,$-336,45975,34.7%,$3801853,$83,36624,27.7%,35193,26.6%
+$50001 to $75000,245406,9.1%,$701,$576,205400,83.7%,$836,$687,$-149,$-30530120,139791,57.0%,$-40495060,$-290,65609,26.7%,$9964432,$152,40007,16.3%,39028,15.9%
+$75001 to $100000,165713,6.1%,$1452,$1261,163885,98.9%,$1468,$1275,$-193,$-31638784,120428,72.7%,$-44416856,$-369,43457,26.2%,$12778093,$294,1828,1.1%,1759,1.1%
+$100001 to $150000,225396,8.3%,$2929,$3055,220631,97.9%,$2992,$3121,$129,$28517960,121628,54.0%,$-24284616,$-200,99003,43.9%,$52802576,$533,4765,2.1%,4765,2.1%
+$150001 to $200000,42792,1.6%,$5236,$5812,41448,96.9%,$5235,$5829,$595,$24642470,7562,17.7%,$-786251,$-104,33886,79.2%,$25429746,$750,1344,3.1%,0,0.0%
+$200001 to $300000,55391,2.0%,$9952,$10126,55391,100.0%,$9952,$10126,$174,$9646339,25962,46.9%,$-7259498,$-280,29429,53.1%,$16905836,$574,0,0.0%,0,0.0%
+$300001 to $500000,32748,1.2%,$16226,$15433,32748,100.0%,$16226,$15433,$-793,$-25961084,26670,81.4%,$-27887880,$-1046,6078,18.6%,$1926795,$317,0,0.0%,0,0.0%
+$500001 to $1000000,11418,0.4%,$31912,$29003,11417,100.0%,$31913,$29004,$-2909,$-33216482,11403,99.9%,$-33299206,$-2920,15,0.1%,$82722,$5703,0,0.0%,0,0.0%
+Over $1000000,6993,0.3%,$171527,$151221,6993,100.0%,$171530,$151223,$-20306,$-141996240,6961,99.5%,$-146692704,$-21074,32,0.5%,$4696465,$147081,0,0.0%,0,0.0%
+Total,2705850,100.0%,$1488,$1410,969313,35.8%,$4145,$3926,$-219,$-212012432,558718,20.6%,$-345724288,$-619,410595,15.2%,$133710992,$326,1736536,64.2%,1730213,63.9%
diff --git a/us/states/sc/h4216_analysis/5.21_rate/test/sc_h4216_5.21_analysis.ipynb b/us/states/sc/h4216_analysis/5.21_rate/test/sc_h4216_5.21_analysis.ipynb
new file mode 100644
index 0000000..ae510a9
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.21_rate/test/sc_h4216_5.21_analysis.ipynb
@@ -0,0 +1,555 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "cell-0",
+   "metadata": {},
+   "source": [
+    "# SC H.4216 Tax Reform Analysis - 5.21% Top Rate\n",
+    "\n",
+    "This notebook produces analysis in the same format as the RFA fiscal note for direct comparison.\n",
+    "\n",
+    "**Dataset:** `hf://policyengine/test/mar/SC.h5`\n",
+    "\n",
+    "**Reform:** H.4216 with 5.21% top rate (bill default)\n",
+    "\n",
+    "**RFA Estimate:** -$308,700,000"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "cell-1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\n",
+    "from policyengine_core.reforms import Reform\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/test/mar/SC.h5\"\n",
+    "TAX_YEAR = 2026\n",
+    "TOP_RATE = 0.0521  # 5.21% top rate\n",
+    "RFA_ESTIMATE = -308700000"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "cell-2",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loading simulations...\n",
+      "Done!\n"
+     ]
+    }
+   ],
+   "source": [
+    "def create_h4216_reform(top_rate=0.0521):\n",
+    "    \"\"\"\n",
+    "    SC H.4216 Reform:\n",
+    "    - 1.99% up to $30k\n",
+    "    - top_rate over $30k (default 5.21% for bill version)\n",
+    "    \"\"\"\n",
+    "    param_reform = Reform.from_dict(\n",
+    "        {\n",
+    "            \"gov.contrib.states.sc.h4216.in_effect\": {\n",
+    "                \"2026-01-01.2100-12-31\": True\n",
+    "            },\n",
+    "            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n",
+    "                \"2026-01-01.2100-12-31\": top_rate\n",
+    "            }\n",
+    "        },\n",
+    "        country_id=\"us\",\n",
+    "    )\n",
+    "    base_reform = create_sc_h4216()\n",
+    "    return (base_reform, param_reform)\n",
+    "\n",
+    "print(\"Loading simulations...\")\n",
+    "baseline = Microsimulation(dataset=SC_DATASET)\n",
+    "reform_sim = Microsimulation(dataset=SC_DATASET, reform=create_h4216_reform(TOP_RATE))\n",
+    "print(\"Done!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "cell-3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Total tax units: 42,461\n",
+      "Weighted tax units: 2,705,850\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Get data - use .values to avoid double-weighting\n",
+    "baseline_tax = baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "reform_tax = reform_sim.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "agi = baseline.calculate(\"adjusted_gross_income\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "weight = baseline.calculate(\"tax_unit_weight\", period=TAX_YEAR).values\n",
+    "\n",
+    "tax_change = reform_tax - baseline_tax\n",
+    "\n",
+    "print(f\"Total tax units: {len(baseline_tax):,}\")\n",
+    "print(f\"Weighted tax units: {weight.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "cell-4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Bracket analysis complete!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Define income brackets matching RFA exactly\n",
+    "income_brackets = [\n",
+    "    (float('-inf'), 0, \"$0*\"),\n",
+    "    (0, 10000, \"$1 to $10000\"),\n",
+    "    (10000, 20000, \"$10001 to $20000\"),\n",
+    "    (20000, 30000, \"$20001 to $30000\"),\n",
+    "    (30000, 40000, \"$30001 to $40000\"),\n",
+    "    (40000, 50000, \"$40001 to $50000\"),\n",
+    "    (50000, 75000, \"$50001 to $75000\"),\n",
+    "    (75000, 100000, \"$75001 to $100000\"),\n",
+    "    (100000, 150000, \"$100001 to $150000\"),\n",
+    "    (150000, 200000, \"$150001 to $200000\"),\n",
+    "    (200000, 300000, \"$200001 to $300000\"),\n",
+    "    (300000, 500000, \"$300001 to $500000\"),\n",
+    "    (500000, 1000000, \"$500001 to $1000000\"),\n",
+    "    (1000000, float('inf'), \"Over $1000000\")\n",
+    "]\n",
+    "\n",
+    "total_weight = weight.sum()\n",
+    "results = []\n",
+    "\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    if lower == float('-inf'):\n",
+    "        mask = agi <= upper\n",
+    "    elif upper == float('inf'):\n",
+    "        mask = agi > lower\n",
+    "    else:\n",
+    "        mask = (agi > lower) & (agi <= upper)\n",
+    "    \n",
+    "    if mask.sum() == 0:\n",
+    "        continue\n",
+    "    \n",
+    "    # Basic stats\n",
+    "    est_returns = weight[mask].sum()\n",
+    "    pct_returns = est_returns / total_weight * 100\n",
+    "    \n",
+    "    old_avg_tax = np.average(baseline_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    new_avg_tax = np.average(reform_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Returns with tax change (threshold $1)\n",
+    "    change_mask = mask & (np.abs(tax_change) > 1)\n",
+    "    returns_with_change = weight[change_mask].sum()\n",
+    "    pct_with_change = returns_with_change / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    if returns_with_change > 0:\n",
+    "        old_avg_changed = np.average(baseline_tax[change_mask], weights=weight[change_mask])\n",
+    "        new_avg_changed = np.average(reform_tax[change_mask], weights=weight[change_mask])\n",
+    "        avg_change = np.average(tax_change[change_mask], weights=weight[change_mask])\n",
+    "    else:\n",
+    "        old_avg_changed = 0\n",
+    "        new_avg_changed = 0\n",
+    "        avg_change = 0\n",
+    "    \n",
+    "    total_change = (tax_change[mask] * weight[mask]).sum()\n",
+    "    \n",
+    "    # Tax decrease\n",
+    "    decrease_mask = mask & (tax_change < -1)\n",
+    "    decrease_returns = weight[decrease_mask].sum()\n",
+    "    decrease_pct = decrease_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_decrease = (tax_change[decrease_mask] * weight[decrease_mask]).sum() if decrease_returns > 0 else 0\n",
+    "    avg_decrease = np.average(tax_change[decrease_mask], weights=weight[decrease_mask]) if decrease_returns > 0 else 0\n",
+    "    \n",
+    "    # Tax increase\n",
+    "    increase_mask = mask & (tax_change > 1)\n",
+    "    increase_returns = weight[increase_mask].sum()\n",
+    "    increase_pct = increase_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_increase = (tax_change[increase_mask] * weight[increase_mask]).sum() if increase_returns > 0 else 0\n",
+    "    avg_increase = np.average(tax_change[increase_mask], weights=weight[increase_mask]) if increase_returns > 0 else 0\n",
+    "    \n",
+    "    # No change\n",
+    "    no_change_mask = mask & (np.abs(tax_change) <= 1)\n",
+    "    no_change_returns = weight[no_change_mask].sum()\n",
+    "    no_change_pct = no_change_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Zero tax\n",
+    "    zero_tax_mask = mask & (reform_tax <= 0)\n",
+    "    zero_tax_returns = weight[zero_tax_mask].sum()\n",
+    "    zero_tax_pct = zero_tax_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    results.append({\n",
+    "        \"Federal AGI Range\": label,\n",
+    "        \"Est # Returns\": int(round(est_returns)),\n",
+    "        \"Est % Returns\": f\"{pct_returns:.1f}%\",\n",
+    "        \"Old Avg Tax Liability\": f\"${int(round(old_avg_tax))}\",\n",
+    "        \"New Avg Tax Liability\": f\"${int(round(new_avg_tax))}\",\n",
+    "        \"Returns with Tax Change\": int(round(returns_with_change)),\n",
+    "        \"% Returns in Range with Change\": f\"{pct_with_change:.1f}%\",\n",
+    "        \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed))}\",\n",
+    "        \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed))}\",\n",
+    "        \"Avg Tax Change\": f\"${int(round(avg_change))}\",\n",
+    "        \"Total Dollar Change\": f\"${int(round(total_change))}\",\n",
+    "        \"Tax Decrease # Returns\": int(round(decrease_returns)),\n",
+    "        \"Tax Decrease % in Range\": f\"{decrease_pct:.1f}%\",\n",
+    "        \"Total Decrease Amount\": f\"${int(round(total_decrease))}\",\n",
+    "        \"Avg Decrease Amount\": f\"${int(round(avg_decrease))}\",\n",
+    "        \"Tax Increase # Returns\": int(round(increase_returns)),\n",
+    "        \"Tax Increase % in Range\": f\"{increase_pct:.1f}%\",\n",
+    "        \"Total Increase Amount\": f\"${int(round(total_increase))}\",\n",
+    "        \"Avg Increase Amount\": f\"${int(round(avg_increase))}\",\n",
+    "        \"No Tax Change # Returns\": int(round(no_change_returns)),\n",
+    "        \"No Change % Returns\": f\"{no_change_pct:.1f}%\",\n",
+    "        \"Zero Tax # Returns\": int(round(zero_tax_returns)),\n",
+    "        \"Zero Tax % Returns\": f\"{zero_tax_pct:.1f}%\"\n",
+    "    })\n",
+    "\n",
+    "print(\"Bracket analysis complete!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "cell-5",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Totals calculated!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Calculate totals\n",
+    "change_mask_all = np.abs(tax_change) > 1\n",
+    "decrease_mask_all = tax_change < -1\n",
+    "increase_mask_all = tax_change > 1\n",
+    "no_change_mask_all = np.abs(tax_change) <= 1\n",
+    "zero_tax_mask_all = reform_tax <= 0\n",
+    "\n",
+    "total_old_avg = np.average(baseline_tax, weights=weight)\n",
+    "total_new_avg = np.average(reform_tax, weights=weight)\n",
+    "total_change_amount = (tax_change * weight).sum()\n",
+    "\n",
+    "returns_with_change_all = weight[change_mask_all].sum()\n",
+    "old_avg_changed_all = np.average(baseline_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "new_avg_changed_all = np.average(reform_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "avg_change_all = np.average(tax_change[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "\n",
+    "decrease_returns_all = weight[decrease_mask_all].sum()\n",
+    "total_decrease_all = (tax_change[decrease_mask_all] * weight[decrease_mask_all]).sum()\n",
+    "avg_decrease_all = np.average(tax_change[decrease_mask_all], weights=weight[decrease_mask_all]) if decrease_returns_all > 0 else 0\n",
+    "\n",
+    "increase_returns_all = weight[increase_mask_all].sum()\n",
+    "total_increase_all = (tax_change[increase_mask_all] * weight[increase_mask_all]).sum()\n",
+    "avg_increase_all = np.average(tax_change[increase_mask_all], weights=weight[increase_mask_all]) if increase_returns_all > 0 else 0\n",
+    "\n",
+    "no_change_returns_all = weight[no_change_mask_all].sum()\n",
+    "zero_tax_returns_all = weight[zero_tax_mask_all].sum()\n",
+    "\n",
+    "results.append({\n",
+    "    \"Federal AGI Range\": \"Total\",\n",
+    "    \"Est # Returns\": int(round(total_weight)),\n",
+    "    \"Est % Returns\": \"100.0%\",\n",
+    "    \"Old Avg Tax Liability\": f\"${int(round(total_old_avg))}\",\n",
+    "    \"New Avg Tax Liability\": f\"${int(round(total_new_avg))}\",\n",
+    "    \"Returns with Tax Change\": int(round(returns_with_change_all)),\n",
+    "    \"% Returns in Range with Change\": f\"{returns_with_change_all / total_weight * 100:.1f}%\",\n",
+    "    \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed_all))}\",\n",
+    "    \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed_all))}\",\n",
+    "    \"Avg Tax Change\": f\"${int(round(avg_change_all))}\",\n",
+    "    \"Total Dollar Change\": f\"${int(round(total_change_amount))}\",\n",
+    "    \"Tax Decrease # Returns\": int(round(decrease_returns_all)),\n",
+    "    \"Tax Decrease % in Range\": f\"{decrease_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Decrease Amount\": f\"${int(round(total_decrease_all))}\",\n",
+    "    \"Avg Decrease Amount\": f\"${int(round(avg_decrease_all))}\",\n",
+    "    \"Tax Increase # Returns\": int(round(increase_returns_all)),\n",
+    "    \"Tax Increase % in Range\": f\"{increase_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Increase Amount\": f\"${int(round(total_increase_all))}\",\n",
+    "    \"Avg Increase Amount\": f\"${int(round(avg_increase_all))}\",\n",
+    "    \"No Tax Change # Returns\": int(round(no_change_returns_all)),\n",
+    "    \"No Change % Returns\": f\"{no_change_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Zero Tax # Returns\": int(round(zero_tax_returns_all)),\n",
+    "    \"Zero Tax % Returns\": f\"{zero_tax_returns_all / total_weight * 100:.1f}%\"\n",
+    "})\n",
+    "\n",
+    "df_results = pd.DataFrame(results)\n",
+    "print(\"Totals calculated!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "cell-6",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "====================================================================================================\n",
+      "H.4216 - POLICYENGINE ANALYSIS (Test Dataset, 5.21% Top Rate)\n",
+      "====================================================================================================\n",
+      "\n",
+      "Total Returns: 2,705,849\n",
+      "General Fund Impact: $-212,012,432\n",
+      "\n",
+      "RFA Estimate: $-308,700,000\n",
+      "Difference: $96,687,568\n",
+      "Accuracy: 68.7%\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display summary\n",
+    "print(\"=\"*100)\n",
+    "print(f\"H.4216 - POLICYENGINE ANALYSIS (Test Dataset, {TOP_RATE*100:.2f}% Top Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(f\"\\nTotal Returns: {int(total_weight):,}\")\n",
+    "print(f\"General Fund Impact: ${total_change_amount:,.0f}\")\n",
+    "print(f\"\\nRFA Estimate: ${RFA_ESTIMATE:,}\")\n",
+    "print(f\"Difference: ${total_change_amount - RFA_ESTIMATE:,.0f}\")\n",
+    "print(f\"Accuracy: {(1 - abs(total_change_amount - RFA_ESTIMATE) / abs(RFA_ESTIMATE)) * 100:.1f}%\")\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "cell-7",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Exported to: pe_h4216_5.21_analysis.csv\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Export to CSV in RFA format\n",
+    "df_results.to_csv('pe_h4216_5.21_analysis.csv', index=False)\n",
+    "print(\"Exported to: pe_h4216_5.21_analysis.csv\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "cell-8",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "KEY METRICS:\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability Total Dollar Change\n",
+      "                $0*         727881         26.9%                    $0                    $0                  $0\n",
+      "       $1 to $10000         498186         18.4%                    $0                    $0                  $0\n",
+      "   $10001 to $20000         233000          8.6%                    $0                    $4             $847688\n",
+      "   $20001 to $30000         171515          6.3%                   $40                   $56            $2756262\n",
+      "   $30001 to $40000         157010          5.8%                  $149                  $135           $-2140517\n",
+      "   $40001 to $50000         132402          4.9%                  $399                  $301          $-12939930\n",
+      "   $50001 to $75000         245406          9.1%                  $701                  $576          $-30530120\n",
+      "  $75001 to $100000         165713          6.1%                 $1452                 $1261          $-31638784\n",
+      " $100001 to $150000         225396          8.3%                 $2929                 $3055           $28517960\n",
+      " $150001 to $200000          42792          1.6%                 $5236                 $5812           $24642470\n",
+      " $200001 to $300000          55391          2.0%                 $9952                $10126            $9646339\n",
+      " $300001 to $500000          32748          1.2%                $16226                $15433          $-25961084\n",
+      "$500001 to $1000000          11418          0.4%                $31912                $29003          $-33216482\n",
+      "      Over $1000000           6993          0.3%               $171527               $151221         $-141996240\n",
+      "              Total        2705850        100.0%                 $1488                 $1410         $-212012432\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display key columns for quick comparison\n",
+    "display_cols = [\n",
+    "    \"Federal AGI Range\", \"Est # Returns\", \"Est % Returns\",\n",
+    "    \"Old Avg Tax Liability\", \"New Avg Tax Liability\", \"Total Dollar Change\"\n",
+    "]\n",
+    "print(\"\\nKEY METRICS:\")\n",
+    "print(df_results[display_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "cell-9",
+   "metadata": {},
+   "source": [
+    "## Side-by-Side Comparison with RFA"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "cell-10",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "====================================================================================================\n",
+      "POLICYENGINE (Test) vs RFA COMPARISON (5.21% Rate)\n",
+      "====================================================================================================\n",
+      "          AGI Range PE Returns RFA Returns     PE Impact    RFA Impact         Diff\n",
+      "                $0*    727,881      78,854            $0     $-671,000    $+671,000\n",
+      "       $1 to $10000    498,186     286,253            $0    $1,653,000  $-1,653,000\n",
+      "   $10001 to $20000    233,000     310,122      $847,688    $2,867,000  $-2,019,312\n",
+      "   $20001 to $30000    171,515     275,560    $2,756,262      $762,000  $+1,994,262\n",
+      "   $30001 to $40000    157,010     269,566   $-2,140,517  $-19,416,000 $+17,275,483\n",
+      "   $40001 to $50000    132,402     234,386  $-12,939,930  $-42,568,000 $+29,628,070\n",
+      "   $50001 to $75000    245,406     407,593  $-30,530,120  $-89,935,000 $+59,404,880\n",
+      "  $75001 to $100000    165,713     250,437  $-31,638,784  $-48,624,000 $+16,985,216\n",
+      " $100001 to $150000    225,396     298,343   $28,517,960  $-26,092,000 $+54,609,960\n",
+      " $150001 to $200000     42,792     143,398   $24,642,470   $23,766,000    $+876,470\n",
+      " $200001 to $300000     55,391     109,340    $9,646,339    $3,955,000  $+5,691,339\n",
+      " $300001 to $500000     32,748      56,123  $-25,961,084  $-32,054,000  $+6,092,916\n",
+      "$500001 to $1000000     11,418      25,664  $-33,216,482  $-37,381,000  $+4,164,518\n",
+      "      Over $1000000      6,993      11,936 $-141,996,240  $-44,989,000 $-97,007,240\n",
+      "              Total  2,705,850   2,757,573 $-212,012,432 $-308,700,000 $+96,687,568\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Load RFA data\n",
+    "rfa_df = pd.read_csv('../rfa_h4216_5.21_analysis.csv')\n",
+    "\n",
+    "def parse_dollar(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('$', '').replace(',', '').replace('%', ''))\n",
+    "    return val\n",
+    "\n",
+    "def parse_pct(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('%', ''))\n",
+    "    return val\n",
+    "\n",
+    "# Create comparison\n",
+    "comparison = []\n",
+    "for idx, pe_row in df_results.iterrows():\n",
+    "    agi_range = pe_row['Federal AGI Range']\n",
+    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == agi_range]\n",
+    "    \n",
+    "    pe_returns = pe_row['Est # Returns']\n",
+    "    pe_impact = parse_dollar(pe_row['Total Dollar Change'])\n",
+    "    \n",
+    "    if len(rfa_match) > 0:\n",
+    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
+    "        rfa_impact = parse_dollar(rfa_match['Total Dollar Change'].values[0])\n",
+    "    else:\n",
+    "        rfa_returns = 0\n",
+    "        rfa_impact = 0\n",
+    "    \n",
+    "    comparison.append({\n",
+    "        'AGI Range': agi_range,\n",
+    "        'PE Returns': f\"{pe_returns:,}\",\n",
+    "        'RFA Returns': f\"{rfa_returns:,}\" if rfa_returns else \"N/A\",\n",
+    "        'PE Impact': f\"${pe_impact:,.0f}\",\n",
+    "        'RFA Impact': f\"${rfa_impact:,.0f}\" if rfa_impact else \"N/A\",\n",
+    "        'Diff': f\"${pe_impact - rfa_impact:+,.0f}\" if rfa_impact else \"N/A\"\n",
+    "    })\n",
+    "\n",
+    "comparison_df = pd.DataFrame(comparison)\n",
+    "print(\"\\n\" + \"=\"*100)\n",
+    "print(\"POLICYENGINE (Test) vs RFA COMPARISON (5.21% Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(comparison_df.to_string(index=False))\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "cell-11",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "========================================================================================================================\n",
+      "FULL POLICYENGINE ANALYSIS (RFA Format)\n",
+      "========================================================================================================================\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability  Returns with Tax Change % Returns in Range with Change Old Avg Tax (Changed) New Avg Tax (Changed) Avg Tax Change Total Dollar Change  Tax Decrease # Returns Tax Decrease % in Range Total Decrease Amount Avg Decrease Amount  Tax Increase # Returns Tax Increase % in Range Total Increase Amount Avg Increase Amount  No Tax Change # Returns No Change % Returns  Zero Tax # Returns Zero Tax % Returns\n",
+      "                $0*         727881         26.9%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   727881              100.0%              727881             100.0%\n",
+      "       $1 to $10000         498186         18.4%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   498186              100.0%              498186             100.0%\n",
+      "   $10001 to $20000         233000          8.6%                    $0                    $4                    16527                           7.1%                    $0                   $51            $51             $847688                       0                    0.0%                    $0                  $0                   16527                    7.1%               $847510                 $51                   216473               92.9%              215471              92.5%\n",
+      "   $20001 to $30000         171515          6.3%                   $40                   $56                    48979                          28.6%                  $131                  $187            $56            $2756262                    2691                    1.6%               $-22726                 $-8                   46288                   27.0%              $2778858                 $60                   122536               71.4%              121168              70.6%\n",
+      "   $30001 to $40000         157010          5.8%                  $149                  $135                    70118                          44.7%                  $333                  $302           $-31           $-2140517                   45821                   29.2%             $-3836658                $-84                   24298                   15.5%              $1696106                 $70                    86892               55.3%               86762              55.3%\n",
+      "   $40001 to $50000         132402          4.9%                  $399                  $301                    95777                          72.3%                  $548                  $413          $-135          $-12939930                   49802                   37.6%            $-16742836               $-336                   45975                   34.7%              $3801853                 $83                    36624               27.7%               35193              26.6%\n",
+      "   $50001 to $75000         245406          9.1%                  $701                  $576                   205400                          83.7%                  $836                  $687          $-149          $-30530120                  139791                   57.0%            $-40495060               $-290                   65609                   26.7%              $9964432                $152                    40007               16.3%               39028              15.9%\n",
+      "  $75001 to $100000         165713          6.1%                 $1452                 $1261                   163885                          98.9%                 $1468                 $1275          $-193          $-31638784                  120428                   72.7%            $-44416856               $-369                   43457                   26.2%             $12778093                $294                     1828                1.1%                1759               1.1%\n",
+      " $100001 to $150000         225396          8.3%                 $2929                 $3055                   220631                          97.9%                 $2992                 $3121           $129           $28517960                  121628                   54.0%            $-24284616               $-200                   99003                   43.9%             $52802576                $533                     4765                2.1%                4765               2.1%\n",
+      " $150001 to $200000          42792          1.6%                 $5236                 $5812                    41448                          96.9%                 $5235                 $5829           $595           $24642470                    7562                   17.7%              $-786251               $-104                   33886                   79.2%             $25429746                $750                     1344                3.1%                   0               0.0%\n",
+      " $200001 to $300000          55391          2.0%                 $9952                $10126                    55391                         100.0%                 $9952                $10126           $174            $9646339                   25962                   46.9%             $-7259498               $-280                   29429                   53.1%             $16905836                $574                        0                0.0%                   0               0.0%\n",
+      " $300001 to $500000          32748          1.2%                $16226                $15433                    32748                         100.0%                $16226                $15433          $-793          $-25961084                   26670                   81.4%            $-27887880              $-1046                    6078                   18.6%              $1926795                $317                        0                0.0%                   0               0.0%\n",
+      "$500001 to $1000000          11418          0.4%                $31912                $29003                    11417                         100.0%                $31913                $29004         $-2909          $-33216482                   11403                   99.9%            $-33299206              $-2920                      15                    0.1%                $82722               $5703                        0                0.0%                   0               0.0%\n",
+      "      Over $1000000           6993          0.3%               $171527               $151221                     6993                         100.0%               $171530               $151223        $-20306         $-141996240                    6961                   99.5%           $-146692704             $-21074                      32                    0.5%              $4696465             $147081                        0                0.0%                   0               0.0%\n",
+      "              Total        2705850        100.0%                 $1488                 $1410                   969313                          35.8%                 $4145                 $3926          $-219         $-212012432                  558718                   20.6%           $-345724288               $-619                  410595                   15.2%            $133710992                $326                  1736536               64.2%             1730213              63.9%\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Full results table\n",
+    "print(\"\\n\" + \"=\"*120)\n",
+    "print(\"FULL POLICYENGINE ANALYSIS (RFA Format)\")\n",
+    "print(\"=\"*120)\n",
+    "pd.set_option('display.max_columns', None)\n",
+    "pd.set_option('display.width', None)\n",
+    "print(df_results.to_string(index=False))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/us/states/sc/rfa_h4216_analysis.csv b/us/states/sc/h4216_analysis/5.39_rate/rfa_h4216_analysis.csv
similarity index 100%
rename from us/states/sc/rfa_h4216_analysis.csv
rename to us/states/sc/h4216_analysis/5.39_rate/rfa_h4216_analysis.csv
diff --git a/us/states/sc/h4216_analysis/5.39_rate/state/pe_h4216_5.39_state_analysis.csv b/us/states/sc/h4216_analysis/5.39_rate/state/pe_h4216_5.39_state_analysis.csv
new file mode 100644
index 0000000..6ed079c
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.39_rate/state/pe_h4216_5.39_state_analysis.csv
@@ -0,0 +1,16 @@
+Federal AGI Range,Est # Returns,Est % Returns,Old Avg Tax Liability,New Avg Tax Liability,Returns with Tax Change,% Returns in Range with Change,Old Avg Tax (Changed),New Avg Tax (Changed),Avg Tax Change,Total Dollar Change,Tax Decrease # Returns,Tax Decrease % in Range,Total Decrease Amount,Avg Decrease Amount,Tax Increase # Returns,Tax Increase % in Range,Total Increase Amount,Avg Increase Amount,No Tax Change # Returns,No Change % Returns,Zero Tax # Returns,Zero Tax % Returns
+$0*,619010,21.1%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,619010,100.0%,619010,100.0%
+$1 to $10000,502276,17.1%,$0,$0,0,0.0%,$0,$0,$0,$0,0,0.0%,$0,$0,0,0.0%,$0,$0,502276,100.0%,502276,100.0%
+$10001 to $20000,279412,9.5%,$0,$10,53961,19.3%,$0,$50,$50,$2672942,0,0.0%,$0,$0,53961,19.3%,$2672922,$50,225451,80.7%,225413,80.7%
+$20001 to $30000,252863,8.6%,$64,$101,136052,53.8%,$119,$188,$68,$9294693,5029,2.0%,$-40734,$-8,131023,51.8%,$9335378,$71,116811,46.2%,116751,46.2%
+$30001 to $40000,215980,7.4%,$225,$200,135926,62.9%,$356,$316,$-40,$-5431497,88710,41.1%,$-8472465,$-96,47216,21.9%,$3040994,$64,80055,37.1%,79265,36.7%
+$40001 to $50000,197525,6.7%,$547,$406,152733,77.3%,$706,$524,$-182,$-27750680,99989,50.6%,$-33876124,$-339,52744,26.7%,$6125390,$116,44792,22.7%,44131,22.3%
+$50001 to $75000,300857,10.2%,$822,$734,254734,84.7%,$971,$867,$-104,$-26516064,163843,54.5%,$-42432168,$-259,90891,30.2%,$15916106,$175,46123,15.3%,46125,15.3%
+$75001 to $100000,177284,6.0%,$1781,$1673,168196,94.9%,$1875,$1761,$-114,$-19091546,123948,69.9%,$-33622528,$-271,44248,25.0%,$14531019,$328,9088,5.1%,9124,5.1%
+$100001 to $150000,187946,6.4%,$3292,$3490,186777,99.4%,$3310,$3510,$199,$37224792,80645,42.9%,$-11527897,$-143,106132,56.5%,$48752732,$459,1169,0.6%,1105,0.6%
+$150001 to $200000,73396,2.5%,$6049,$6621,73396,100.0%,$6049,$6621,$572,$41990104,5919,8.1%,$-1521388,$-257,67477,91.9%,$43511488,$645,0,0.0%,0,0.0%
+$200001 to $300000,52882,1.8%,$9164,$9669,52844,99.9%,$9161,$9666,$504,$26656968,6389,12.1%,$-1749618,$-274,46455,87.8%,$28406596,$611,38,0.1%,0,0.0%
+$300001 to $500000,36977,1.3%,$17163,$17280,36977,100.0%,$17163,$17280,$116,$4306962,20370,55.1%,$-12902031,$-633,16607,44.9%,$17208994,$1036,0,0.0%,0,0.0%
+$500001 to $1000000,16526,0.6%,$26140,$25753,16526,100.0%,$26140,$25753,$-387,$-6389232,14096,85.3%,$-14481286,$-1027,2430,14.7%,$8092054,$3331,0,0.0%,0,0.0%
+Over $1000000,22686,0.8%,$139623,$129256,22686,100.0%,$139623,$129256,$-10367,$-235194960,22658,99.9%,$-235526416,$-10395,29,0.1%,$331456,$11553,0,0.0%,0,0.0%
+Total,2935621,100.0%,$2220,$2153,1290809,44.0%,$5048,$4894,$-154,$-198227520,631596,21.5%,$-396152640,$-627,659213,22.5%,$197925120,$300,1644813,56.0%,1643201,56.0%
diff --git a/us/states/sc/h4216_analysis/5.39_rate/state/sc_h4216_5.39_state_analysis.ipynb b/us/states/sc/h4216_analysis/5.39_rate/state/sc_h4216_5.39_state_analysis.ipynb
new file mode 100644
index 0000000..a95395d
--- /dev/null
+++ b/us/states/sc/h4216_analysis/5.39_rate/state/sc_h4216_5.39_state_analysis.ipynb
@@ -0,0 +1,550 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "cell-0",
+   "metadata": {},
+   "source": [
+    "# SC H.4216 Tax Reform Analysis - 5.39% Top Rate (State Dataset)\n",
+    "\n",
+    "This notebook produces analysis in the same format as the RFA fiscal note for direct comparison.\n",
+    "\n",
+    "**Dataset:** `hf://policyengine/policyengine-us-data/states/SC.h5` (Production)\n",
+    "\n",
+    "**Reform:** H.4216 with 5.39% top rate (RFA version)\n",
+    "\n",
+    "**RFA Estimate:** -$119,100,000"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "cell-1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from policyengine_us import Microsimulation\n",
+    "from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\n",
+    "from policyengine_core.reforms import Reform\n",
+    "import pandas as pd\n",
+    "import numpy as np\n",
+    "\n",
+    "SC_DATASET = \"hf://policyengine/policyengine-us-data/states/SC.h5\"\n",
+    "TAX_YEAR = 2026\n",
+    "TOP_RATE = 0.0539  # 5.39% top rate\n",
+    "RFA_ESTIMATE = -119100000"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "cell-2",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Loading simulations...\n",
+      "Done!\n"
+     ]
+    }
+   ],
+   "source": [
+    "def create_h4216_reform(top_rate=0.0539):\n",
+    "    \"\"\"\n",
+    "    SC H.4216 Reform:\n",
+    "    - 1.99% up to $30k\n",
+    "    - top_rate over $30k (default 5.39% for RFA version)\n",
+    "    \"\"\"\n",
+    "    param_reform = Reform.from_dict(\n",
+    "        {\n",
+    "            \"gov.contrib.states.sc.h4216.in_effect\": {\n",
+    "                \"2026-01-01.2100-12-31\": True\n",
+    "            },\n",
+    "            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n",
+    "                \"2026-01-01.2100-12-31\": top_rate\n",
+    "            }\n",
+    "        },\n",
+    "        country_id=\"us\",\n",
+    "    )\n",
+    "    base_reform = create_sc_h4216()\n",
+    "    return (base_reform, param_reform)\n",
+    "\n",
+    "print(\"Loading simulations...\")\n",
+    "baseline = Microsimulation(dataset=SC_DATASET)\n",
+    "reform_sim = Microsimulation(dataset=SC_DATASET, reform=create_h4216_reform(TOP_RATE))\n",
+    "print(\"Done!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "cell-3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Total tax units: 49,486\n",
+      "Weighted tax units: 2,935,621\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Get data - use .values to avoid double-weighting\n",
+    "baseline_tax = baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "reform_tax = reform_sim.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "agi = baseline.calculate(\"adjusted_gross_income\", period=TAX_YEAR, map_to=\"tax_unit\").values\n",
+    "weight = baseline.calculate(\"tax_unit_weight\", period=TAX_YEAR).values\n",
+    "\n",
+    "tax_change = reform_tax - baseline_tax\n",
+    "\n",
+    "print(f\"Total tax units: {len(baseline_tax):,}\")\n",
+    "print(f\"Weighted tax units: {weight.sum():,.0f}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "cell-4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Bracket analysis complete!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Define income brackets matching RFA exactly\n",
+    "income_brackets = [\n",
+    "    (float('-inf'), 0, \"$0*\"),\n",
+    "    (0, 10000, \"$1 to $10000\"),\n",
+    "    (10000, 20000, \"$10001 to $20000\"),\n",
+    "    (20000, 30000, \"$20001 to $30000\"),\n",
+    "    (30000, 40000, \"$30001 to $40000\"),\n",
+    "    (40000, 50000, \"$40001 to $50000\"),\n",
+    "    (50000, 75000, \"$50001 to $75000\"),\n",
+    "    (75000, 100000, \"$75001 to $100000\"),\n",
+    "    (100000, 150000, \"$100001 to $150000\"),\n",
+    "    (150000, 200000, \"$150001 to $200000\"),\n",
+    "    (200000, 300000, \"$200001 to $300000\"),\n",
+    "    (300000, 500000, \"$300001 to $500000\"),\n",
+    "    (500000, 1000000, \"$500001 to $1000000\"),\n",
+    "    (1000000, float('inf'), \"Over $1000000\")\n",
+    "]\n",
+    "\n",
+    "total_weight = weight.sum()\n",
+    "results = []\n",
+    "\n",
+    "for lower, upper, label in income_brackets:\n",
+    "    if lower == float('-inf'):\n",
+    "        mask = agi <= upper\n",
+    "    elif upper == float('inf'):\n",
+    "        mask = agi > lower\n",
+    "    else:\n",
+    "        mask = (agi > lower) & (agi <= upper)\n",
+    "    \n",
+    "    if mask.sum() == 0:\n",
+    "        continue\n",
+    "    \n",
+    "    # Basic stats\n",
+    "    est_returns = weight[mask].sum()\n",
+    "    pct_returns = est_returns / total_weight * 100\n",
+    "    \n",
+    "    old_avg_tax = np.average(baseline_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    new_avg_tax = np.average(reform_tax[mask], weights=weight[mask]) if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Returns with tax change (threshold $1)\n",
+    "    change_mask = mask & (np.abs(tax_change) > 1)\n",
+    "    returns_with_change = weight[change_mask].sum()\n",
+    "    pct_with_change = returns_with_change / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    if returns_with_change > 0:\n",
+    "        old_avg_changed = np.average(baseline_tax[change_mask], weights=weight[change_mask])\n",
+    "        new_avg_changed = np.average(reform_tax[change_mask], weights=weight[change_mask])\n",
+    "        avg_change = np.average(tax_change[change_mask], weights=weight[change_mask])\n",
+    "    else:\n",
+    "        old_avg_changed = 0\n",
+    "        new_avg_changed = 0\n",
+    "        avg_change = 0\n",
+    "    \n",
+    "    total_change = (tax_change[mask] * weight[mask]).sum()\n",
+    "    \n",
+    "    # Tax decrease\n",
+    "    decrease_mask = mask & (tax_change < -1)\n",
+    "    decrease_returns = weight[decrease_mask].sum()\n",
+    "    decrease_pct = decrease_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_decrease = (tax_change[decrease_mask] * weight[decrease_mask]).sum() if decrease_returns > 0 else 0\n",
+    "    avg_decrease = np.average(tax_change[decrease_mask], weights=weight[decrease_mask]) if decrease_returns > 0 else 0\n",
+    "    \n",
+    "    # Tax increase\n",
+    "    increase_mask = mask & (tax_change > 1)\n",
+    "    increase_returns = weight[increase_mask].sum()\n",
+    "    increase_pct = increase_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    total_increase = (tax_change[increase_mask] * weight[increase_mask]).sum() if increase_returns > 0 else 0\n",
+    "    avg_increase = np.average(tax_change[increase_mask], weights=weight[increase_mask]) if increase_returns > 0 else 0\n",
+    "    \n",
+    "    # No change\n",
+    "    no_change_mask = mask & (np.abs(tax_change) <= 1)\n",
+    "    no_change_returns = weight[no_change_mask].sum()\n",
+    "    no_change_pct = no_change_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    # Zero tax\n",
+    "    zero_tax_mask = mask & (reform_tax <= 0)\n",
+    "    zero_tax_returns = weight[zero_tax_mask].sum()\n",
+    "    zero_tax_pct = zero_tax_returns / est_returns * 100 if est_returns > 0 else 0\n",
+    "    \n",
+    "    results.append({\n",
+    "        \"Federal AGI Range\": label,\n",
+    "        \"Est # Returns\": int(round(est_returns)),\n",
+    "        \"Est % Returns\": f\"{pct_returns:.1f}%\",\n",
+    "        \"Old Avg Tax Liability\": f\"${int(round(old_avg_tax))}\",\n",
+    "        \"New Avg Tax Liability\": f\"${int(round(new_avg_tax))}\",\n",
+    "        \"Returns with Tax Change\": int(round(returns_with_change)),\n",
+    "        \"% Returns in Range with Change\": f\"{pct_with_change:.1f}%\",\n",
+    "        \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed))}\",\n",
+    "        \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed))}\",\n",
+    "        \"Avg Tax Change\": f\"${int(round(avg_change))}\",\n",
+    "        \"Total Dollar Change\": f\"${int(round(total_change))}\",\n",
+    "        \"Tax Decrease # Returns\": int(round(decrease_returns)),\n",
+    "        \"Tax Decrease % in Range\": f\"{decrease_pct:.1f}%\",\n",
+    "        \"Total Decrease Amount\": f\"${int(round(total_decrease))}\",\n",
+    "        \"Avg Decrease Amount\": f\"${int(round(avg_decrease))}\",\n",
+    "        \"Tax Increase # Returns\": int(round(increase_returns)),\n",
+    "        \"Tax Increase % in Range\": f\"{increase_pct:.1f}%\",\n",
+    "        \"Total Increase Amount\": f\"${int(round(total_increase))}\",\n",
+    "        \"Avg Increase Amount\": f\"${int(round(avg_increase))}\",\n",
+    "        \"No Tax Change # Returns\": int(round(no_change_returns)),\n",
+    "        \"No Change % Returns\": f\"{no_change_pct:.1f}%\",\n",
+    "        \"Zero Tax # Returns\": int(round(zero_tax_returns)),\n",
+    "        \"Zero Tax % Returns\": f\"{zero_tax_pct:.1f}%\"\n",
+    "    })\n",
+    "\n",
+    "print(\"Bracket analysis complete!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "cell-5",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Totals calculated!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Calculate totals\n",
+    "change_mask_all = np.abs(tax_change) > 1\n",
+    "decrease_mask_all = tax_change < -1\n",
+    "increase_mask_all = tax_change > 1\n",
+    "no_change_mask_all = np.abs(tax_change) <= 1\n",
+    "zero_tax_mask_all = reform_tax <= 0\n",
+    "\n",
+    "total_old_avg = np.average(baseline_tax, weights=weight)\n",
+    "total_new_avg = np.average(reform_tax, weights=weight)\n",
+    "total_change_amount = (tax_change * weight).sum()\n",
+    "\n",
+    "returns_with_change_all = weight[change_mask_all].sum()\n",
+    "old_avg_changed_all = np.average(baseline_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "new_avg_changed_all = np.average(reform_tax[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "avg_change_all = np.average(tax_change[change_mask_all], weights=weight[change_mask_all]) if returns_with_change_all > 0 else 0\n",
+    "\n",
+    "decrease_returns_all = weight[decrease_mask_all].sum()\n",
+    "total_decrease_all = (tax_change[decrease_mask_all] * weight[decrease_mask_all]).sum()\n",
+    "avg_decrease_all = np.average(tax_change[decrease_mask_all], weights=weight[decrease_mask_all]) if decrease_returns_all > 0 else 0\n",
+    "\n",
+    "increase_returns_all = weight[increase_mask_all].sum()\n",
+    "total_increase_all = (tax_change[increase_mask_all] * weight[increase_mask_all]).sum()\n",
+    "avg_increase_all = np.average(tax_change[increase_mask_all], weights=weight[increase_mask_all]) if increase_returns_all > 0 else 0\n",
+    "\n",
+    "no_change_returns_all = weight[no_change_mask_all].sum()\n",
+    "zero_tax_returns_all = weight[zero_tax_mask_all].sum()\n",
+    "\n",
+    "results.append({\n",
+    "    \"Federal AGI Range\": \"Total\",\n",
+    "    \"Est # Returns\": int(round(total_weight)),\n",
+    "    \"Est % Returns\": \"100.0%\",\n",
+    "    \"Old Avg Tax Liability\": f\"${int(round(total_old_avg))}\",\n",
+    "    \"New Avg Tax Liability\": f\"${int(round(total_new_avg))}\",\n",
+    "    \"Returns with Tax Change\": int(round(returns_with_change_all)),\n",
+    "    \"% Returns in Range with Change\": f\"{returns_with_change_all / total_weight * 100:.1f}%\",\n",
+    "    \"Old Avg Tax (Changed)\": f\"${int(round(old_avg_changed_all))}\",\n",
+    "    \"New Avg Tax (Changed)\": f\"${int(round(new_avg_changed_all))}\",\n",
+    "    \"Avg Tax Change\": f\"${int(round(avg_change_all))}\",\n",
+    "    \"Total Dollar Change\": f\"${int(round(total_change_amount))}\",\n",
+    "    \"Tax Decrease # Returns\": int(round(decrease_returns_all)),\n",
+    "    \"Tax Decrease % in Range\": f\"{decrease_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Decrease Amount\": f\"${int(round(total_decrease_all))}\",\n",
+    "    \"Avg Decrease Amount\": f\"${int(round(avg_decrease_all))}\",\n",
+    "    \"Tax Increase # Returns\": int(round(increase_returns_all)),\n",
+    "    \"Tax Increase % in Range\": f\"{increase_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Total Increase Amount\": f\"${int(round(total_increase_all))}\",\n",
+    "    \"Avg Increase Amount\": f\"${int(round(avg_increase_all))}\",\n",
+    "    \"No Tax Change # Returns\": int(round(no_change_returns_all)),\n",
+    "    \"No Change % Returns\": f\"{no_change_returns_all / total_weight * 100:.1f}%\",\n",
+    "    \"Zero Tax # Returns\": int(round(zero_tax_returns_all)),\n",
+    "    \"Zero Tax % Returns\": f\"{zero_tax_returns_all / total_weight * 100:.1f}%\"\n",
+    "})\n",
+    "\n",
+    "df_results = pd.DataFrame(results)\n",
+    "print(\"Totals calculated!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "cell-6",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "====================================================================================================\n",
+      "H.4216 - POLICYENGINE ANALYSIS (State Dataset, 5.39% Top Rate)\n",
+      "====================================================================================================\n",
+      "\n",
+      "Total Returns: 2,935,621\n",
+      "General Fund Impact: $-198,227,520\n",
+      "\n",
+      "RFA Estimate: $-119,100,000\n",
+      "Difference: $-79,127,520\n",
+      "Accuracy: 33.6%\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display summary\n",
+    "print(\"=\"*100)\n",
+    "print(f\"H.4216 - POLICYENGINE ANALYSIS (State Dataset, {TOP_RATE*100:.2f}% Top Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(f\"\\nTotal Returns: {int(total_weight):,}\")\n",
+    "print(f\"General Fund Impact: ${total_change_amount:,.0f}\")\n",
+    "print(f\"\\nRFA Estimate: ${RFA_ESTIMATE:,}\")\n",
+    "print(f\"Difference: ${total_change_amount - RFA_ESTIMATE:,.0f}\")\n",
+    "print(f\"Accuracy: {(1 - abs(total_change_amount - RFA_ESTIMATE) / abs(RFA_ESTIMATE)) * 100:.1f}%\")\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "cell-7",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Exported to: pe_h4216_5.39_state_analysis.csv\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Export to CSV in RFA format\n",
+    "df_results.to_csv('pe_h4216_5.39_state_analysis.csv', index=False)\n",
+    "print(\"Exported to: pe_h4216_5.39_state_analysis.csv\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "cell-8",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "KEY METRICS:\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability Total Dollar Change\n",
+      "                $0*         619010         21.1%                    $0                    $0                  $0\n",
+      "       $1 to $10000         502276         17.1%                    $0                    $0                  $0\n",
+      "   $10001 to $20000         279412          9.5%                    $0                   $10            $2672942\n",
+      "   $20001 to $30000         252863          8.6%                   $64                  $101            $9294693\n",
+      "   $30001 to $40000         215980          7.4%                  $225                  $200           $-5431497\n",
+      "   $40001 to $50000         197525          6.7%                  $547                  $406          $-27750680\n",
+      "   $50001 to $75000         300857         10.2%                  $822                  $734          $-26516064\n",
+      "  $75001 to $100000         177284          6.0%                 $1781                 $1673          $-19091546\n",
+      " $100001 to $150000         187946          6.4%                 $3292                 $3490           $37224792\n",
+      " $150001 to $200000          73396          2.5%                 $6049                 $6621           $41990104\n",
+      " $200001 to $300000          52882          1.8%                 $9164                 $9669           $26656968\n",
+      " $300001 to $500000          36977          1.3%                $17163                $17280            $4306962\n",
+      "$500001 to $1000000          16526          0.6%                $26140                $25753           $-6389232\n",
+      "      Over $1000000          22686          0.8%               $139623               $129256         $-235194960\n",
+      "              Total        2935621        100.0%                 $2220                 $2153         $-198227520\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Display key columns for quick comparison\n",
+    "display_cols = [\n",
+    "    \"Federal AGI Range\", \"Est # Returns\", \"Est % Returns\",\n",
+    "    \"Old Avg Tax Liability\", \"New Avg Tax Liability\", \"Total Dollar Change\"\n",
+    "]\n",
+    "print(\"\\nKEY METRICS:\")\n",
+    "print(df_results[display_cols].to_string(index=False))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "cell-9",
+   "metadata": {},
+   "source": [
+    "## Side-by-Side Comparison with RFA"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "cell-10",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "====================================================================================================\n",
+      "POLICYENGINE (State) vs RFA COMPARISON (5.39% Rate)\n",
+      "====================================================================================================\n",
+      "          AGI Range PE Returns RFA Returns     PE Impact    RFA Impact          Diff\n",
+      "                $0*    619,010      78,854            $0     $-571,000     $+571,000\n",
+      "       $1 to $10000    502,276     286,253            $0    $1,655,000   $-1,655,000\n",
+      "   $10001 to $20000    279,412     310,122    $2,672,942    $2,872,000     $-199,058\n",
+      "   $20001 to $30000    252,863     275,560    $9,294,693      $769,000   $+8,525,693\n",
+      "   $30001 to $40000    215,980     269,566   $-5,431,497  $-19,360,000  $+13,928,503\n",
+      "   $40001 to $50000    197,525     234,386  $-27,750,680  $-41,986,000  $+14,235,320\n",
+      "   $50001 to $75000    300,857     407,593  $-26,516,064  $-82,146,000  $+55,629,936\n",
+      "  $75001 to $100000    177,284     250,437  $-19,091,546  $-36,461,000  $+17,369,454\n",
+      " $100001 to $150000    187,946     298,343   $37,224,792    $3,115,000  $+34,109,792\n",
+      " $150001 to $200000     73,396     143,398   $41,990,104   $50,933,000   $-8,942,896\n",
+      " $200001 to $300000     52,882     109,340   $26,656,968   $36,718,000  $-10,061,032\n",
+      " $300001 to $500000     36,977      56,123    $4,306,962   $-4,627,000   $+8,933,962\n",
+      "$500001 to $1000000     16,526      25,664   $-6,389,232  $-16,195,000   $+9,805,768\n",
+      "      Over $1000000     22,686      11,936 $-235,194,960  $-13,767,000 $-221,427,960\n",
+      "              Total  2,935,621   2,757,573 $-198,227,520 $-119,100,000  $-79,127,520\n",
+      "====================================================================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Load RFA data\n",
+    "rfa_df = pd.read_csv('../rfa_h4216_analysis.csv')\n",
+    "\n",
+    "def parse_dollar(val):\n",
+    "    if isinstance(val, str):\n",
+    "        return float(val.replace('$', '').replace(',', '').replace('%', ''))\n",
+    "    return val\n",
+    "\n",
+    "# Create comparison\n",
+    "comparison = []\n",
+    "for idx, pe_row in df_results.iterrows():\n",
+    "    agi_range = pe_row['Federal AGI Range']\n",
+    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == agi_range]\n",
+    "    \n",
+    "    pe_returns = pe_row['Est # Returns']\n",
+    "    pe_impact = parse_dollar(pe_row['Total Dollar Change'])\n",
+    "    \n",
+    "    if len(rfa_match) > 0:\n",
+    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
+    "        rfa_impact = parse_dollar(rfa_match['Total Dollar Change'].values[0])\n",
+    "    else:\n",
+    "        rfa_returns = 0\n",
+    "        rfa_impact = 0\n",
+    "    \n",
+    "    comparison.append({\n",
+    "        'AGI Range': agi_range,\n",
+    "        'PE Returns': f\"{pe_returns:,}\",\n",
+    "        'RFA Returns': f\"{rfa_returns:,}\" if rfa_returns else \"N/A\",\n",
+    "        'PE Impact': f\"${pe_impact:,.0f}\",\n",
+    "        'RFA Impact': f\"${rfa_impact:,.0f}\" if rfa_impact else \"N/A\",\n",
+    "        'Diff': f\"${pe_impact - rfa_impact:+,.0f}\" if rfa_impact else \"N/A\"\n",
+    "    })\n",
+    "\n",
+    "comparison_df = pd.DataFrame(comparison)\n",
+    "print(\"\\n\" + \"=\"*100)\n",
+    "print(\"POLICYENGINE (State) vs RFA COMPARISON (5.39% Rate)\")\n",
+    "print(\"=\"*100)\n",
+    "print(comparison_df.to_string(index=False))\n",
+    "print(\"=\"*100)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "id": "cell-11",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "========================================================================================================================\n",
+      "FULL POLICYENGINE ANALYSIS (RFA Format)\n",
+      "========================================================================================================================\n",
+      "  Federal AGI Range  Est # Returns Est % Returns Old Avg Tax Liability New Avg Tax Liability  Returns with Tax Change % Returns in Range with Change Old Avg Tax (Changed) New Avg Tax (Changed) Avg Tax Change Total Dollar Change  Tax Decrease # Returns Tax Decrease % in Range Total Decrease Amount Avg Decrease Amount  Tax Increase # Returns Tax Increase % in Range Total Increase Amount Avg Increase Amount  No Tax Change # Returns No Change % Returns  Zero Tax # Returns Zero Tax % Returns\n",
+      "                $0*         619010         21.1%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   619010              100.0%              619010             100.0%\n",
+      "       $1 to $10000         502276         17.1%                    $0                    $0                        0                           0.0%                    $0                    $0             $0                  $0                       0                    0.0%                    $0                  $0                       0                    0.0%                    $0                  $0                   502276              100.0%              502276             100.0%\n",
+      "   $10001 to $20000         279412          9.5%                    $0                   $10                    53961                          19.3%                    $0                   $50            $50            $2672942                       0                    0.0%                    $0                  $0                   53961                   19.3%              $2672922                 $50                   225451               80.7%              225413              80.7%\n",
+      "   $20001 to $30000         252863          8.6%                   $64                  $101                   136052                          53.8%                  $119                  $188            $68            $9294693                    5029                    2.0%               $-40734                 $-8                  131023                   51.8%              $9335378                 $71                   116811               46.2%              116751              46.2%\n",
+      "   $30001 to $40000         215980          7.4%                  $225                  $200                   135926                          62.9%                  $356                  $316           $-40           $-5431497                   88710                   41.1%             $-8472465                $-96                   47216                   21.9%              $3040994                 $64                    80055               37.1%               79265              36.7%\n",
+      "   $40001 to $50000         197525          6.7%                  $547                  $406                   152733                          77.3%                  $706                  $524          $-182          $-27750680                   99989                   50.6%            $-33876124               $-339                   52744                   26.7%              $6125390                $116                    44792               22.7%               44131              22.3%\n",
+      "   $50001 to $75000         300857         10.2%                  $822                  $734                   254734                          84.7%                  $971                  $867          $-104          $-26516064                  163843                   54.5%            $-42432168               $-259                   90891                   30.2%             $15916106                $175                    46123               15.3%               46125              15.3%\n",
+      "  $75001 to $100000         177284          6.0%                 $1781                 $1673                   168196                          94.9%                 $1875                 $1761          $-114          $-19091546                  123948                   69.9%            $-33622528               $-271                   44248                   25.0%             $14531019                $328                     9088                5.1%                9124               5.1%\n",
+      " $100001 to $150000         187946          6.4%                 $3292                 $3490                   186777                          99.4%                 $3310                 $3510           $199           $37224792                   80645                   42.9%            $-11527897               $-143                  106132                   56.5%             $48752732                $459                     1169                0.6%                1105               0.6%\n",
+      " $150001 to $200000          73396          2.5%                 $6049                 $6621                    73396                         100.0%                 $6049                 $6621           $572           $41990104                    5919                    8.1%             $-1521388               $-257                   67477                   91.9%             $43511488                $645                        0                0.0%                   0               0.0%\n",
+      " $200001 to $300000          52882          1.8%                 $9164                 $9669                    52844                          99.9%                 $9161                 $9666           $504           $26656968                    6389                   12.1%             $-1749618               $-274                   46455                   87.8%             $28406596                $611                       38                0.1%                   0               0.0%\n",
+      " $300001 to $500000          36977          1.3%                $17163                $17280                    36977                         100.0%                $17163                $17280           $116            $4306962                   20370                   55.1%            $-12902031               $-633                   16607                   44.9%             $17208994               $1036                        0                0.0%                   0               0.0%\n",
+      "$500001 to $1000000          16526          0.6%                $26140                $25753                    16526                         100.0%                $26140                $25753          $-387           $-6389232                   14096                   85.3%            $-14481286              $-1027                    2430                   14.7%              $8092054               $3331                        0                0.0%                   0               0.0%\n",
+      "      Over $1000000          22686          0.8%               $139623               $129256                    22686                         100.0%               $139623               $129256        $-10367         $-235194960                   22658                   99.9%           $-235526416             $-10395                      29                    0.1%               $331456              $11553                        0                0.0%                   0               0.0%\n",
+      "              Total        2935621        100.0%                 $2220                 $2153                  1290809                          44.0%                 $5048                 $4894          $-154         $-198227520                  631596                   21.5%           $-396152640               $-627                  659213                   22.5%            $197925120                $300                  1644813               56.0%             1643201              56.0%\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Full results table\n",
+    "print(\"\\n\" + \"=\"*120)\n",
+    "print(\"FULL POLICYENGINE ANALYSIS (RFA Format)\")\n",
+    "print(\"=\"*120)\n",
+    "pd.set_option('display.max_columns', None)\n",
+    "pd.set_option('display.width', None)\n",
+    "print(df_results.to_string(index=False))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/us/states/sc/pe_h4216_test_analysis.csv b/us/states/sc/h4216_analysis/5.39_rate/test/pe_h4216_test_analysis.csv
similarity index 100%
rename from us/states/sc/pe_h4216_test_analysis.csv
rename to us/states/sc/h4216_analysis/5.39_rate/test/pe_h4216_test_analysis.csv
diff --git a/us/states/sc/sc_h4216_test_analysis.ipynb b/us/states/sc/h4216_analysis/5.39_rate/test/sc_h4216_test_analysis.ipynb
similarity index 87%
rename from us/states/sc/sc_h4216_test_analysis.ipynb
rename to us/states/sc/h4216_analysis/5.39_rate/test/sc_h4216_test_analysis.ipynb
index 65013a1..2f0f470 100644
--- a/us/states/sc/sc_h4216_test_analysis.ipynb
+++ b/us/states/sc/h4216_analysis/5.39_rate/test/sc_h4216_test_analysis.ipynb
@@ -404,84 +404,11 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": null,
    "id": "cell-10",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "====================================================================================================\n",
-      "POLICYENGINE vs RFA COMPARISON\n",
-      "====================================================================================================\n",
-      "          AGI Range PE Returns RFA Returns     PE Impact    RFA Impact         Diff\n",
-      "                $0*    727,881      78,854            $0     $-571,000    $+571,000\n",
-      "       $1 to $10000    498,186     286,253            $0    $1,655,000  $-1,655,000\n",
-      "   $10001 to $20000    233,000     310,122      $847,688    $2,872,000  $-2,024,312\n",
-      "   $20001 to $30000    171,515     275,560    $2,756,262      $769,000  $+1,987,262\n",
-      "   $30001 to $40000    157,010     269,566   $-2,140,517  $-19,360,000 $+17,219,483\n",
-      "   $40001 to $50000    132,402     234,386  $-12,807,614  $-41,986,000 $+29,178,386\n",
-      "   $50001 to $75000    245,406     407,593  $-28,577,564  $-82,146,000 $+53,568,436\n",
-      "  $75001 to $100000    165,713     250,437  $-26,753,744  $-36,461,000  $+9,707,256\n",
-      " $100001 to $150000    225,396     298,343   $49,609,656    $3,115,000 $+46,494,656\n",
-      " $150001 to $200000     42,792     143,398   $32,593,342   $50,933,000 $-18,339,658\n",
-      " $200001 to $300000     55,391     109,340   $28,205,350   $36,718,000  $-8,512,650\n",
-      " $300001 to $500000     32,748      56,123   $-8,944,396   $-4,627,000  $-4,317,396\n",
-      "$500001 to $1000000     11,418      25,664  $-21,936,012  $-16,195,000  $-5,741,012\n",
-      "      Over $1000000      6,993      11,936 $-105,563,360  $-13,767,000 $-91,796,360\n",
-      "              Total  2,705,850   2,757,573  $-92,710,912 $-119,100,000 $+26,389,088\n",
-      "====================================================================================================\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Load RFA data\n",
-    "rfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n",
-    "\n",
-    "def parse_dollar(val):\n",
-    "    if isinstance(val, str):\n",
-    "        return float(val.replace('$', '').replace(',', '').replace('%', ''))\n",
-    "    return val\n",
-    "\n",
-    "def parse_pct(val):\n",
-    "    if isinstance(val, str):\n",
-    "        return float(val.replace('%', ''))\n",
-    "    return val\n",
-    "\n",
-    "# Create comparison\n",
-    "comparison = []\n",
-    "for idx, pe_row in df_results.iterrows():\n",
-    "    agi_range = pe_row['Federal AGI Range']\n",
-    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == agi_range]\n",
-    "    \n",
-    "    pe_returns = pe_row['Est # Returns']\n",
-    "    pe_impact = parse_dollar(pe_row['Total Dollar Change'])\n",
-    "    \n",
-    "    if len(rfa_match) > 0:\n",
-    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
-    "        rfa_impact = parse_dollar(rfa_match['Total Dollar Change'].values[0])\n",
-    "    else:\n",
-    "        rfa_returns = 0\n",
-    "        rfa_impact = 0\n",
-    "    \n",
-    "    comparison.append({\n",
-    "        'AGI Range': agi_range,\n",
-    "        'PE Returns': f\"{pe_returns:,}\",\n",
-    "        'RFA Returns': f\"{rfa_returns:,}\" if rfa_returns else \"N/A\",\n",
-    "        'PE Impact': f\"${pe_impact:,.0f}\",\n",
-    "        'RFA Impact': f\"${rfa_impact:,.0f}\" if rfa_impact else \"N/A\",\n",
-    "        'Diff': f\"${pe_impact - rfa_impact:+,.0f}\" if rfa_impact else \"N/A\"\n",
-    "    })\n",
-    "\n",
-    "comparison_df = pd.DataFrame(comparison)\n",
-    "print(\"\\n\" + \"=\"*100)\n",
-    "print(\"POLICYENGINE vs RFA COMPARISON\")\n",
-    "print(\"=\"*100)\n",
-    "print(comparison_df.to_string(index=False))\n",
-    "print(\"=\"*100)"
-   ]
+   "outputs": [],
+   "source": "# Load RFA data\nrfa_df = pd.read_csv('../rfa_h4216_analysis.csv')\n\ndef parse_dollar(val):\n    if isinstance(val, str):\n        return float(val.replace('$', '').replace(',', '').replace('%', ''))\n    return val\n\ndef parse_pct(val):\n    if isinstance(val, str):\n        return float(val.replace('%', ''))\n    return val\n\n# Create comparison\ncomparison = []\nfor idx, pe_row in df_results.iterrows():\n    agi_range = pe_row['Federal AGI Range']\n    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == agi_range]\n    \n    pe_returns = pe_row['Est # Returns']\n    pe_impact = parse_dollar(pe_row['Total Dollar Change'])\n    \n    if len(rfa_match) > 0:\n        rfa_returns = rfa_match['Est # Returns'].values[0]\n        rfa_impact = parse_dollar(rfa_match['Total Dollar Change'].values[0])\n    else:\n        rfa_returns = 0\n        rfa_impact = 0\n    \n    comparison.append({\n        'AGI Range': agi_range,\n        'PE Returns': f\"{pe_returns:,}\",\n        'RFA Returns': f\"{rfa_returns:,}\" if rfa_returns else \"N/A\",\n        'PE Impact': f\"${pe_impact:,.0f}\",\n        'RFA Impact': f\"${rfa_impact:,.0f}\" if rfa_impact else \"N/A\",\n        'Diff': f\"${pe_impact - rfa_impact:+,.0f}\" if rfa_impact else \"N/A\"\n    })\n\ncomparison_df = pd.DataFrame(comparison)\nprint(\"\\n\" + \"=\"*100)\nprint(\"POLICYENGINE (Test) vs RFA COMPARISON (5.39% Rate)\")\nprint(\"=\"*100)\nprint(comparison_df.to_string(index=False))\nprint(\"=\"*100)"
   },
   {
    "cell_type": "code",
@@ -548,4 +475,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 5
-}
+}
\ No newline at end of file
diff --git a/us/states/sc/h4216_analysis/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis/h4216_analysis_comparison.md
new file mode 100644
index 0000000..f274508
--- /dev/null
+++ b/us/states/sc/h4216_analysis/h4216_analysis_comparison.md
@@ -0,0 +1,286 @@
+# SC H.4216 Analysis: PolicyEngine vs RFA Comparison
+
+## Executive Summary
+
+This analysis compares PolicyEngine estimates against the SC Revenue and Fiscal Affairs (RFA) fiscal notes for H.4216, a tax reform bill that restructures South Carolina's income tax system.
+
+### Budget Impact Summary
+
+| Rate Option | RFA Estimate | State Dataset | Test Dataset | State Accuracy | Test Accuracy |
+|-------------|--------------|---------------|--------------|----------------|---------------|
+| **5.21%** | **-$308.7M** | -$393.0M | -$212.0M | 73% (27% over) | 69% (31% under) |
+| **5.39%** | **-$119.1M** | -$198.2M | -$92.7M | 34% (66% over) | 78% (22% under) |
+
+**Key Finding:** The policy encoding is correct. All discrepancies stem from dataset characteristics, primarily the distribution of millionaire tax filers.
+
+---
+
+## H.4216 Reform Structure
+
+### Current SC Tax System (Baseline)
+- 0% on income up to $3,640
+- 3% on income $3,640 to $18,230
+- 6% on income over $18,230
+- Taxable income = Federal Taxable Income + SC Additions - SC Subtractions
+
+### H.4216 Reform
+- 1.99% on income up to $30,000
+- 5.21% (bill default) or 5.39% (RFA version) on income over $30,000
+- Taxable income = AGI - SC Subtractions - SCIAD (new deduction)
+- No federal standard/itemized deductions in base
+
+### SCIAD (SC Individual Adjustment Deduction)
+
+| Filing Status | Deduction | Phase-out Start | Phase-out End |
+|---------------|-----------|-----------------|---------------|
+| Single | $15,000 | $40,000 AGI | $95,000 AGI |
+| MFJ | $30,000 | $80,000 AGI | $190,000 AGI |
+| HoH | $22,500 | $60,000 AGI | $142,500 AGI |
+
+---
+
+## Dataset Comparison
+
+### Overview
+
+| Metric | RFA | State (Production) | Test |
+|--------|-----|-------------------|------|
+| **Total Returns** | 2,757,573 | 2,935,621 (+6.5%) | 2,705,850 (-1.9%) |
+| **Millionaire Returns** | 11,936 | 22,686 (+90%) | 6,993 (-41%) |
+| **Baseline Revenue** | ~$6.4B | ~$6.5B | ~$4.0B |
+| **Median HH AGI** | N/A | $43,222 | $34,927 |
+| **Avg HH AGI** | N/A | $103,858 | $74,061 |
+| **Max AGI** | N/A | $6.4M | $418.7M |
+
+### Dataset Paths
+- **State (Production):** `hf://policyengine/policyengine-us-data/states/SC.h5`
+- **Test:** `hf://policyengine/test/mar/SC.h5`
+
+---
+
+## 5.21% Rate Analysis
+
+### Budget Impact by Income Bracket
+
+| AGI Range | RFA | State | Test | State vs RFA | Test vs RFA |
+|-----------|-----|-------|------|--------------|-------------|
+| $0* | -$671K | $0 | $0 | +$671K | +$671K |
+| $1-$10K | +$1.7M | $0 | $0 | -$1.7M | -$1.7M |
+| $10K-$20K | +$2.9M | +$2.7M | +$0.8M | -$0.2M | -$2.1M |
+| $20K-$30K | +$0.8M | +$9.3M | +$2.8M | +$8.5M | +$2.0M |
+| $30K-$40K | -$19.4M | -$5.4M | -$2.1M | +$14.0M | +$17.3M |
+| $40K-$50K | -$42.6M | -$28.1M | -$12.9M | +$14.5M | +$29.7M |
+| $50K-$75K | -$89.9M | -$30.1M | -$30.5M | +$59.8M | +$59.4M |
+| $75K-$100K | -$48.6M | -$26.5M | -$31.6M | +$22.1M | +$17.0M |
+| $100K-$150K | -$26.1M | +$17.9M | +$28.5M | +$44.0M | +$54.6M |
+| $150K-$200K | +$23.8M | +$26.7M | +$24.6M | +$2.9M | +$0.8M |
+| $200K-$300K | +$4.0M | +$10.3M | +$9.6M | +$6.3M | +$5.6M |
+| $300K-$500K | -$32.1M | -$16.5M | -$26.0M | +$15.6M | +$6.1M |
+| $500K-$1M | -$37.4M | -$20.3M | -$33.2M | +$17.1M | +$4.2M |
+| **Over $1M** | **-$45.0M** | **-$332.9M** | **-$142.0M** | **-$287.9M** | **-$97.0M** |
+| **TOTAL** | **-$308.7M** | **-$393.0M** | **-$212.0M** | **-$84.3M** | **+$96.7M** |
+
+### Winner/Loser Distribution (5.21%)
+
+| Metric | RFA | State | Test |
+|--------|-----|-------|------|
+| **Tax Decrease** | 42.8% | 23.8% | 20.6% |
+| **Tax Increase** | 22.6% | 20.1% | 15.2% |
+| **No Change** | 34.6% | 56.0% | 64.2% |
+| **Total Decrease $** | -$522.1M | -$545.9M | -$345.7M |
+| **Total Increase $** | +$213.4M | +$152.9M | +$133.7M |
+
+---
+
+## 5.39% Rate Analysis
+
+### Budget Impact by Income Bracket
+
+| AGI Range | RFA | State | Test | State vs RFA | Test vs RFA |
+|-----------|-----|-------|------|--------------|-------------|
+| $0* | -$571K | $0 | $0 | +$571K | +$571K |
+| $1-$10K | +$1.7M | $0 | $0 | -$1.7M | -$1.7M |
+| $10K-$20K | +$2.9M | +$2.7M | +$0.8M | -$0.2M | -$2.1M |
+| $20K-$30K | +$0.8M | +$9.3M | +$2.8M | +$8.5M | +$2.0M |
+| $30K-$40K | -$19.4M | -$5.4M | -$2.1M | +$14.0M | +$17.3M |
+| $40K-$50K | -$42.0M | -$27.8M | -$12.8M | +$14.2M | +$29.2M |
+| $50K-$75K | -$82.1M | -$26.5M | -$28.6M | +$55.6M | +$53.5M |
+| $75K-$100K | -$36.5M | -$19.1M | -$26.8M | +$17.4M | +$9.7M |
+| $100K-$150K | +$3.1M | +$37.2M | +$49.6M | +$34.1M | +$46.5M |
+| $150K-$200K | +$50.9M | +$42.0M | +$32.6M | -$8.9M | -$18.3M |
+| $200K-$300K | +$36.7M | +$26.7M | +$28.2M | -$10.0M | -$8.5M |
+| $300K-$500K | -$4.6M | +$4.3M | -$8.9M | +$8.9M | -$4.3M |
+| $500K-$1M | -$16.2M | -$6.4M | -$21.9M | +$9.8M | -$5.7M |
+| **Over $1M** | **-$13.8M** | **-$235.2M** | **-$105.6M** | **-$221.4M** | **-$91.8M** |
+| **TOTAL** | **-$119.1M** | **-$198.2M** | **-$92.7M** | **-$79.1M** | **+$26.4M** |
+
+### Winner/Loser Distribution (5.39%)
+
+| Metric | RFA | State | Test |
+|--------|-----|-------|------|
+| **Tax Decrease** | 38.7% | 21.5% | 18.3% |
+| **Tax Increase** | 26.7% | 22.5% | 17.6% |
+| **No Change** | 34.6% | 56.0% | 64.1% |
+| **Total Decrease $** | -$388.7M | -$396.2M | -$259.2M |
+| **Total Increase $** | +$269.6M | +$197.9M | +$166.5M |
+
+---
+
+## Root Cause Analysis
+
+### 1. Millionaire Distribution (Primary Driver)
+
+The millionaire bracket (>$1M AGI) is the dominant driver of discrepancies:
+
+| Metric | RFA | State | Test |
+|--------|-----|-------|------|
+| **Millionaire Count** | 11,936 | 22,686 (+90%) | 6,993 (-41%) |
+| **5.21% Impact** | -$45.0M | -$332.9M | -$142.0M |
+| **5.39% Impact** | -$13.8M | -$235.2M | -$105.6M |
+| **Avg Change (5.21%)** | -$4,031 | -$14,672 | -$20,306 |
+
+**State Dataset:** Has nearly **double** the millionaires RFA reports. This alone accounts for ~$288M of the $84M overestimate at 5.21%.
+
+**Test Dataset:** Has 41% fewer millionaires but an extreme outlier ($418.7M AGI) that skews averages significantly.
+
+### 2. Middle-Income Brackets ($30K-$100K)
+
+RFA shows much larger tax cuts in middle-income brackets:
+
+| Bracket Range | RFA Impact | State Impact | Test Impact |
+|---------------|------------|--------------|-------------|
+| $30K-$100K combined | -$200.5M | -$90.1M | -$77.1M |
+| Difference vs RFA | - | +$110.4M | +$123.4M |
+
+Both PE datasets underweight middle-income filers relative to RFA.
+
+### 3. Upper-Middle Income ($100K-$300K)
+
+PE shows tax **increases** where RFA shows mixed results:
+
+| Bracket Range | RFA Impact | State Impact | Test Impact |
+|---------------|------------|--------------|-------------|
+| $100K-$300K (5.21%) | -$22.1M | +$54.9M | +$62.7M |
+| $100K-$300K (5.39%) | +$90.7M | +$105.9M | +$110.4M |
+
+This suggests SCIAD phase-out behavior may differ or income distributions within brackets vary.
+
+### 4. Low-Income Brackets ($0-$30K)
+
+| Bracket | RFA Returns | State Returns | Test Returns |
+|---------|-------------|---------------|--------------|
+| $0* | 78,854 (2.9%) | 619,010 (21.1%) | 727,881 (26.9%) |
+| $1-$10K | 286,253 (10.4%) | 502,276 (17.1%) | 498,186 (18.4%) |
+
+PE datasets have significantly more zero/low-income tax units. These units have zero tax liability, so they don't affect budget impact but dilute the "% with tax change" statistics.
+
+---
+
+## Summary of Dataset Characteristics
+
+### State (Production) Dataset
+- **Overestimates** tax cuts at both rates
+- Has 90% more millionaires than RFA
+- Higher average incomes ($104K vs $74K Test)
+- Baseline revenue matches RFA (~$6.5B)
+- More total returns than RFA (+6.5%)
+
+### Test Dataset
+- **Underestimates** tax cuts at both rates
+- Has 41% fewer millionaires than RFA
+- Lower average incomes ($74K)
+- Baseline revenue 37% below RFA ($4.0B vs $6.4B)
+- Return count close to RFA (-1.9%)
+- Has extreme outlier ($418.7M AGI)
+
+### Ideal Dataset Would Have
+- RFA's millionaire count (~11,936)
+- RFA's return count (~2.76M)
+- RFA's baseline revenue (~$6.4B)
+- Middle-income weighting matching SC tax filer data
+
+---
+
+## Recommendations
+
+### For Data Team
+1. Investigate millionaire overcount in State dataset (22,686 vs 11,936 RFA)
+2. Investigate baseline revenue undercount in Test dataset ($4.0B vs $6.4B)
+3. Recalibrate weights to match SC DOR filer distribution by income bracket
+4. Validate against IRS SOI data for SC
+
+### For Analysis
+1. Report range of estimates from both datasets
+2. Use State for directional analysis (correct baseline revenue magnitude)
+3. Use Test for return count validation (closer to RFA)
+4. Note millionaire bracket as primary source of uncertainty
+
+### For Reporting
+| Rate | Conservative | Central | Aggressive |
+|------|--------------|---------|------------|
+| 5.21% | -$212M (Test) | -$309M (RFA) | -$393M (State) |
+| 5.39% | -$93M (Test) | -$119M (RFA) | -$198M (State) |
+
+---
+
+## File Structure
+
+```
+sc/
+├── data_exploration.ipynb              # State dataset exploration
+├── data_exploration_test.ipynb         # Test dataset exploration
+├── sc_dataset_summary_weighted.csv     # State dataset summary stats
+├── sc_test_dataset_summary_weighted.csv # Test dataset summary stats
+└── h4216_analysis/
+    ├── h4216_analysis_comparison.md    # This file
+    ├── 5.21_rate/
+    │   ├── rfa_h4216_5.21_analysis.csv # RFA fiscal note data
+    │   ├── state/
+    │   │   ├── pe_h4216_5.21_state_analysis.csv
+    │   │   └── sc_h4216_5.21_state_analysis.ipynb
+    │   └── test/
+    │       ├── pe_h4216_5.21_analysis.csv
+    │       └── sc_h4216_5.21_analysis.ipynb
+    └── 5.39_rate/
+        ├── rfa_h4216_analysis.csv      # RFA fiscal note data
+        ├── state/
+        │   ├── pe_h4216_5.39_state_analysis.csv
+        │   └── sc_h4216_5.39_state_analysis.ipynb
+        └── test/
+            ├── pe_h4216_test_analysis.csv
+            └── sc_h4216_test_analysis.ipynb
+```
+
+---
+
+## Technical Notes
+
+### PR #7514 Fix (February 2025)
+
+Fixed bug where `sc_additions` (QBI and SALT addbacks) were incorrectly applied under H.4216. Since H.4216 starts from AGI (before federal deductions), addbacks are inappropriate.
+
+- **Before fix:** +$39.8M (wrong direction - showed revenue increase)
+- **After fix:** -$93M to -$393M depending on dataset and rate
+
+### Policy Parameters Location
+```
+policyengine-us/policyengine_us/parameters/gov/contrib/states/sc/h4216/
+```
+
+### Microsimulation Usage
+```python
+from policyengine_us import Microsimulation
+from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216
+from policyengine_core.reforms import Reform
+
+# Create reform with specific top rate
+param_reform = Reform.from_dict({
+    "gov.contrib.states.sc.h4216.in_effect": {"2026-01-01.2100-12-31": True},
+    "gov.contrib.states.sc.h4216.rates[1].rate": {"2026-01-01.2100-12-31": 0.0521}
+}, country_id="us")
+
+base_reform = create_sc_h4216()
+reform = (base_reform, param_reform)
+
+sim = Microsimulation(dataset="hf://policyengine/test/mar/SC.h5", reform=reform)
+```
diff --git a/us/states/sc/h4216_analysis_comparison.md b/us/states/sc/h4216_analysis_comparison.md
deleted file mode 100644
index 3728b32..0000000
--- a/us/states/sc/h4216_analysis_comparison.md
+++ /dev/null
@@ -1,174 +0,0 @@
-# SC H.4216 Analysis Comparison: PolicyEngine vs RFA
-
-## Executive Summary
-
-**UPDATE (March 2025):** After PR #7514 fix and testing multiple datasets:
-
-| Dataset | 5.21% Impact | vs RFA (-$309M) | 5.39% Impact | vs RFA (-$119M) |
-|---------|--------------|-----------------|--------------|-----------------|
-| **Production** | -$393M | 73% accuracy | -$198M | 34% accuracy |
-| **Test (Mar)** | -$212M | 69% accuracy | -$93M | 78% accuracy |
-| **RFA** | -$309M | - | -$119M | - |
-
-**Key Finding:** Neither dataset consistently matches RFA. Production overestimates cuts, Test underestimates them. The core issue is baseline revenue calibration.
-
----
-
-## Dataset Comparison
-
-### Overview
-
-| Metric | Production | Test | RFA |
-|--------|------------|------|-----|
-| **Tax Units** | 2,935,621 | 2,705,850 | 2,757,573 |
-| **Baseline Revenue** | $6.5B | $4.0B | ~$6.4B |
-| **Median HH AGI** | $43,222 | $34,927 | N/A |
-| **Avg HH AGI** | $103,858 | $74,061 | N/A |
-| **25th Percentile AGI** | $9,425 | $2,489 | N/A |
-| **Max AGI** | $6.4M | $418.7M | N/A |
-
-### Budget Impact Comparison
-
-| Rate | Production | Test | RFA | Best Match |
-|------|------------|------|-----|------------|
-| **5.21%** | -$393M | -$212M | -$309M | Production (73%) |
-| **5.39%** | -$198M | -$93M | -$119M | Test (78%) |
-
----
-
-## Why Production OVERESTIMATES
-
-Production estimates -$198M vs RFA's -$119M at 5.39% rate (**67% over**)
-
-### 1. Higher Average Incomes
-- Production median AGI: **$43,222** vs Test $34,927
-- Production avg AGI: **$103,858** vs Test $74,061
-- More high earners = larger tax cuts when rates drop
-
-### 2. Higher Baseline Revenue
-- Production: **$6.5B** baseline revenue
-- Test: $4.0B baseline revenue
-- Production has **63% more** baseline revenue than Test
-- Bigger revenue base = bigger absolute cuts
-
-### 3. More Tax Units Than RFA
-- Production: 2,935,621 tax units
-- RFA: 2,757,573 filers
-- **+178,048 extra units** (6.5% more)
-- Includes non-filers with imputed income
-
-### 4. Fewer Low-Income Units
-- Production 25th percentile: **$9,425**
-- Test 25th percentile: $2,489
-- Production has fewer truly low-income/zero-tax units
-- More taxpayers affected by rate changes
-
----
-
-## Why Test UNDERESTIMATES
-
-Test estimates -$93M vs RFA's -$119M at 5.39% rate (**22% under**)
-
-### 1. Lower Baseline Revenue
-- Test: **$4.0B** baseline revenue
-- RFA: ~$6.4B estimated baseline
-- Test has **37% less** revenue than RFA
-- Smaller revenue base = smaller absolute cuts
-
-### 2. Lower Average Incomes
-- Test avg AGI: **$74,061** vs Production $103,858
-- Fewer high-income taxpayers paying significant taxes
-- Smaller tax liabilities to cut
-
-### 3. Extreme Outlier at Top
-- Test max AGI: **$418.7M** (single household)
-- Production max: $6.4M
-- One extreme outlier may distort millionaire calculations
-- Could skew average tax calculations
-
-### 4. More Low-Income Units
-- Test 25th percentile AGI: **$2,489**
-- Production 25th percentile: $9,425
-- More zero-tax units diluting the weighted averages
-- More units unaffected by rate changes
-
----
-
-## The Core Issue: Baseline Revenue Calibration
-
-| Source | Baseline Revenue | vs RFA |
-|--------|------------------|--------|
-| **RFA** | ~$6.4B | - |
-| **Production** | $6.5B | **+2%** |
-| **Test** | $4.0B | **-37%** |
-
-### What Each Dataset Gets Right/Wrong
-
-**Production Dataset:**
-- ✅ Matches RFA baseline revenue (~$6.5B)
-- ❌ Wrong income distribution (too many high earners)
-- ❌ Overestimates tax cuts at all rates
-
-**Test Dataset:**
-- ✅ Better return count (2.71M vs 2.76M RFA)
-- ❌ Severely underestimates baseline revenue ($4B vs $6.4B)
-- ❌ Underestimates tax cuts at all rates
-
-### Ideal Dataset Would Have:
-- Test's return count (~2.7M matching RFA's 2.76M filers)
-- Production's baseline revenue (~$6.5B matching RFA's ~$6.4B)
-- RFA's millionaire distribution (11,936 returns over $1M)
-
----
-
-## Technical Details
-
-### PR #7514 Fix (February 2025)
-
-Fixed bug where `sc_additions` (QBI and SALT addbacks) were incorrectly applied under H.4216. Since H.4216 starts from AGI (before federal deductions), addbacks are inappropriate.
-
-**Before fix:** +$39.8M (wrong direction)
-**After fix:** -$93M to -$198M depending on dataset
-
-### H.4216 Reform Structure
-
-**Baseline SC Taxable Income:**
-```
-taxable_income = federal_taxable_income + sc_additions - sc_subtractions
-```
-
-**H.4216 SC Taxable Income:**
-```
-taxable_income = AGI - sc_subtractions - SCIAD
-```
-
-**Rate Structure:**
-- Current: 0% up to $3,640, 3% $3,640-$18,230, 6% over $18,230
-- H.4216: 1.99% up to $30,000, 5.21%/5.39% over $30,000
-
-### SCIAD Phase-out
-
-| Filing Status | Amount | Phase-out Start | Phase-out End |
-|---------------|--------|-----------------|---------------|
-| Single | $15,000 | $40,000 | $95,000 |
-| MFJ | $30,000 | $80,000 | $190,000 |
-| HoH | $22,500 | $60,000 | $142,500 |
-
----
-
-## Recommendations
-
-### For Data Team:
-1. Investigate why Test dataset has only $4B baseline revenue vs $6.4B actual
-2. Recalibrate weights to match SC tax filer distribution
-3. Validate millionaire counts against IRS SOI data
-
-### For Analysis:
-1. Use Production for directional analysis (correct baseline revenue)
-2. Use Test for return count validation (closer to RFA filer count)
-3. Report range of estimates: -$93M to -$198M for 5.39% rate
-
-### For Reporting:
-- RFA 5.39% estimate: **-$119.1M**
-- RFA 5.21% estimate: **-$309.0M**
-- PE best estimates: **-$93M to -$198M** (5.39%), **-$212M to -$393M** (5.21%)
diff --git a/us/states/sc/sc_h4216_budget_impact.py b/us/states/sc/sc_h4216_budget_impact.py
deleted file mode 100644
index bf80b03..0000000
--- a/us/states/sc/sc_h4216_budget_impact.py
+++ /dev/null
@@ -1,68 +0,0 @@
-"""
-SC H.4216 Budget Impact Analysis
-Simple script to calculate the budgetary impact of H.4216 with default 5.21% top rate.
-"""
-
-from policyengine_us import Microsimulation
-from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216
-from policyengine_core.reforms import Reform
-import numpy as np
-
-SC_DATASET = "hf://policyengine/test/mar/SC.h5"
-TAX_YEAR = 2026
-
-def create_h4216_reform():
-    """
-    SC H.4216 Reform with default rates:
-    - 1.99% up to $30k
-    - 5.21% over $30k (default)
-    """
-    param_reform = Reform.from_dict(
-        {
-            "gov.contrib.states.sc.h4216.in_effect": {
-                "2026-01-01.2100-12-31": True
-            }
-        },
-        country_id="us",
-    )
-    base_reform = create_sc_h4216()
-    return (base_reform, param_reform)
-
-print("Loading baseline...")
-baseline = Microsimulation(dataset=SC_DATASET)
-
-print("Loading reform (H.4216 with 5.21% top rate)...")
-reform = create_h4216_reform()
-reform_sim = Microsimulation(dataset=SC_DATASET, reform=reform)
-
-# Calculate tax impact - use .values to get raw numpy arrays (avoid MicroSeries auto-weighting)
-baseline_tax = baseline.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
-reform_tax = reform_sim.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
-weight = baseline.calculate("tax_unit_weight", period=TAX_YEAR).values
-
-tax_change = reform_tax - baseline_tax
-budget_impact = (tax_change * weight).sum()
-
-# Summary stats (all using raw numpy arrays, no MicroSeries)
-baseline_revenue = (baseline_tax * weight).sum()
-reform_revenue = (reform_tax * weight).sum()
-total_weight = weight.sum()
-
-pct_decrease = weight[tax_change < -1].sum() / total_weight * 100
-pct_increase = weight[tax_change > 1].sum() / total_weight * 100
-pct_unchanged = weight[np.abs(tax_change) <= 1].sum() / total_weight * 100
-
-print("\n" + "="*60)
-print("SC H.4216 BUDGET IMPACT (5.21% Top Rate)")
-print("="*60)
-print(f"\nBaseline SC Income Tax Revenue: ${baseline_revenue:,.0f}")
-print(f"Reform SC Income Tax Revenue:   ${reform_revenue:,.0f}")
-print(f"\n>>> BUDGET IMPACT: ${budget_impact:,.0f} <<<")
-print(f"\nRFA Estimate (5.21%): -$309,000,000")
-print(f"Difference from RFA: ${budget_impact - (-309000000):,.0f}")
-print(f"Accuracy: {(1 - abs(budget_impact - (-309000000)) / 309000000) * 100:.1f}%")
-print("\n" + "-"*60)
-print(f"Tax units with DECREASE: {pct_decrease:.1f}%")
-print(f"Tax units with INCREASE: {pct_increase:.1f}%")
-print(f"Tax units UNCHANGED:     {pct_unchanged:.1f}%")
-print("="*60)
diff --git a/us/states/sc/sc_h4216_dataset_comparison.py b/us/states/sc/sc_h4216_dataset_comparison.py
deleted file mode 100644
index da89d35..0000000
--- a/us/states/sc/sc_h4216_dataset_comparison.py
+++ /dev/null
@@ -1,92 +0,0 @@
-"""
-SC H.4216 Budget Impact Comparison Across Datasets
-Compares budgetary impacts using production, staging, and test datasets.
-"""
-
-from policyengine_us import Microsimulation
-from policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216
-from policyengine_core.reforms import Reform
-import numpy as np
-
-TAX_YEAR = 2026
-
-DATASETS = {
-    "Production": "hf://policyengine/policyengine-us-data/states/SC.h5",
-    "Test (Mar)": "hf://policyengine/test/mar/SC.h5"
-}
-
-def create_h4216_reform(top_rate=0.0521):
-    param_reform = Reform.from_dict(
-        {
-            "gov.contrib.states.sc.h4216.in_effect": {
-                "2026-01-01.2100-12-31": True
-            },
-            "gov.contrib.states.sc.h4216.rates[1].rate": {
-                "2026-01-01.2100-12-31": top_rate
-            }
-        },
-        country_id="us",
-    )
-    base_reform = create_sc_h4216()
-    return (base_reform, param_reform)
-
-def calculate_impact(dataset_path, top_rate):
-    """Calculate budget impact for a given dataset and top rate."""
-    baseline = Microsimulation(dataset=dataset_path)
-    reform = create_h4216_reform(top_rate=top_rate)
-    reform_sim = Microsimulation(dataset=dataset_path, reform=reform)
-
-    baseline_tax = baseline.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
-    reform_tax = reform_sim.calculate("sc_income_tax", period=TAX_YEAR, map_to="tax_unit").values
-    weight = baseline.calculate("tax_unit_weight", period=TAX_YEAR).values
-
-    tax_change = reform_tax - baseline_tax
-    budget_impact = (tax_change * weight).sum()
-    total_units = weight.sum()
-    baseline_revenue = (baseline_tax * weight).sum()
-
-    return {
-        "budget_impact": budget_impact,
-        "total_units": total_units,
-        "baseline_revenue": baseline_revenue
-    }
-
-# Run analysis
-results = {}
-for name, path in DATASETS.items():
-    print(f"\nProcessing {name}...")
-    results[name] = {
-        "5.21%": calculate_impact(path, 0.0521),
-        "5.39%": calculate_impact(path, 0.0539)
-    }
-    print(f"  Done!")
-
-# Print results
-print("\n" + "="*90)
-print("SC H.4216 BUDGET IMPACT COMPARISON ACROSS DATASETS")
-print("="*90)
-
-print(f"\n{'Dataset':<15} {'Tax Units':>15} {'Baseline Rev':>18} {'5.21% Impact':>18} {'5.39% Impact':>18}")
-print("-"*90)
-
-for name in DATASETS.keys():
-    r = results[name]
-    print(f"{name:<15} {r['5.21%']['total_units']:>15,.0f} ${r['5.21%']['baseline_revenue']:>16,.0f} ${r['5.21%']['budget_impact']:>16,.0f} ${r['5.39%']['budget_impact']:>16,.0f}")
-
-print("-"*90)
-print(f"{'RFA Estimate':<15} {'2,757,573':>15} {'N/A':>18} ${-309000000:>16,.0f} ${-119100000:>16,.0f}")
-print("="*90)
-
-# Accuracy comparison
-print("\n" + "="*90)
-print("ACCURACY vs RFA")
-print("="*90)
-print(f"{'Dataset':<15} {'5.21% PE':>15} {'vs RFA -$309M':>18} {'5.39% PE':>15} {'vs RFA -$119M':>18}")
-print("-"*90)
-for name in DATASETS.keys():
-    impact_521 = results[name]["5.21%"]["budget_impact"]
-    impact_539 = results[name]["5.39%"]["budget_impact"]
-    acc_521 = (1 - abs(impact_521 - (-309000000)) / 309000000) * 100
-    acc_539 = (1 - abs(impact_539 - (-119100000)) / 119100000) * 100
-    print(f"{name:<15} ${impact_521:>14,.0f} {acc_521:>16.1f}% ${impact_539:>14,.0f} {acc_539:>16.1f}%")
-print("="*90)
diff --git a/us/states/sc/sc_h4216_reform_analysis.ipynb b/us/states/sc/sc_h4216_reform_analysis.ipynb
deleted file mode 100644
index 5d8bf26..0000000
--- a/us/states/sc/sc_h4216_reform_analysis.ipynb
+++ /dev/null
@@ -1,831 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# South Carolina H.4216 Tax Reform Analysis (Tax Year 2026)\n",
-    "\n",
-    "This notebook analyzes the impact of SC H.4216 tax reform.\n",
-    "\n",
-    "## Proposal\n",
-    "- Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over\n",
-    "- Eliminate the federal standard or itemized deduction\n",
-    "- Allow a new SC Income Adjusted Deduction (SCIAD) at certain income levels\n",
-    "- Maintain all other state adjustments, exemptions, and credits\n",
-    "- Cap SC EITC at $200\n",
-    "\n",
-    "## Current 2026 Marginal Tax Rates\n",
-    "- 0% up to $3,640\n",
-    "- 3% $3,640 - $18,230\n",
-    "- 6% over $18,230\n",
-    "\n",
-    "## Proposed Tax Rates\n",
-    "- 1.99% up to $30,000\n",
-    "- 5.39% over $30,000\n",
-    "\n",
-    "## SC Deduction (SCIAD) Phase-out\n",
-    "| Filing Status | Amount | Phase-out Start | Phase-out End |\n",
-    "|---------------|--------|-----------------|---------------|\n",
-    "| Single | $15,000 | $40,000 | $95,000 |\n",
-    "| Married Joint | $30,000 | $80,000 | $190,000 |\n",
-    "| Head of Household | $22,500 | $60,000 | $142,500 |\n",
-    "\n",
-    "## Implementation Note\n",
-    "This analysis uses the corrected H.4216 implementation (PR #7514) which properly handles SC additions.\n",
-    "The fix removes `sc_additions` from the H.4216 taxable income formula since H.4216 starts from AGI\n",
-    "(before federal deductions), making addbacks for QBI and SALT inappropriate."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": "from policyengine_us import Microsimulation\nfrom policyengine_us.reforms.states.sc.h4216.sc_h4216 import create_sc_h4216\nfrom policyengine_core.reforms import Reform\nimport pandas as pd\nimport numpy as np\n\nSC_DATASET = \"hf://policyengine/test/mar/SC.h5\"\nTAX_YEAR = 2026  # Renamed to avoid conflict with YEAR constant from model_api"
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 2,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Reform function defined!\n"
-     ]
-    }
-   ],
-   "source": [
-    "from policyengine_us.model_api import *\n",
-    "\n",
-    "def create_h4216_reform():\n",
-    "    \"\"\"\n",
-    "    SC H.4216 Reform:\n",
-    "    - Enable H.4216 via in_effect parameter\n",
-    "    - Set rates: 1.99% up to $30k, 5.39% over $30k\n",
-    "    \"\"\"\n",
-    "    # Parameter changes via Reform.from_dict\n",
-    "    param_reform = Reform.from_dict(\n",
-    "        {\n",
-    "            \"gov.contrib.states.sc.h4216.in_effect\": {\n",
-    "                \"2026-01-01.2100-12-31\": True\n",
-    "            },\n",
-    "            \"gov.contrib.states.sc.h4216.rates[1].rate\": {\n",
-    "                \"2026-01-01.2100-12-31\": 0.0539\n",
-    "            }\n",
-    "        },\n",
-    "        country_id=\"us\",\n",
-    "    )\n",
-    "    \n",
-    "    # Get base H.4216 reform (EITC cap, SCIAD, taxable income, tax calculation)\n",
-    "    base_reform = create_sc_h4216()\n",
-    "    \n",
-    "    # Order: base reform first, then parameter overrides\n",
-    "    return (base_reform, param_reform)\n",
-    "\n",
-    "print(\"Reform function defined!\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 3,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Loading baseline (current SC tax law)...\n"
-     ]
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "Xet Storage is enabled for this repo, but the 'hf_xet' package is not installed. Falling back to regular HTTP download. For better performance, install the package with: `pip install huggingface_hub[hf_xet]` or `pip install hf_xet`\n"
-     ]
-    },
-    {
-     "data": {
-      "application/vnd.jupyter.widget-view+json": {
-       "model_id": "eddcbb760af5468b94382e107443581b",
-       "version_major": 2,
-       "version_minor": 0
-      },
-      "text/plain": [
-       "SC.h5:   0%|          | 0.00/52.8M [00:00<?, ?B/s]"
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Baseline loaded\n",
-      "\n",
-      "Loading reform (H.4216 with 5.39% top rate)...\n",
-      "Reform loaded\n",
-      "\n",
-      "============================================================\n",
-      "All simulations ready!\n",
-      "============================================================\n"
-     ]
-    }
-   ],
-   "source": [
-    "print(\"Loading baseline (current SC tax law)...\")\n",
-    "baseline = Microsimulation(dataset=SC_DATASET)\n",
-    "print(\"Baseline loaded\")\n",
-    "\n",
-    "print(\"\\nLoading reform (H.4216 with 5.39% top rate)...\")\n",
-    "reform = create_h4216_reform()\n",
-    "reform_sim = Microsimulation(dataset=SC_DATASET, reform=reform)\n",
-    "print(\"Reform loaded\")\n",
-    "\n",
-    "print(\"\\n\" + \"=\"*60)\n",
-    "print(\"All simulations ready!\")\n",
-    "print(\"=\"*60)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "## Calculate Tax Impacts by Income Bracket"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 4,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Total tax units: 48,461\n",
-      "Weighted tax units (returns): 3,204,719\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Get tax unit level data\n",
-    "baseline_tax = np.array(baseline.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
-    "reform_tax = np.array(reform_sim.calculate(\"sc_income_tax\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
-    "agi = np.array(baseline.calculate(\"adjusted_gross_income\", period=TAX_YEAR, map_to=\"tax_unit\"))\n",
-    "tax_unit_weight = np.array(baseline.calculate(\"tax_unit_weight\", period=TAX_YEAR))\n",
-    "\n",
-    "# Calculate tax change\n",
-    "tax_change = reform_tax - baseline_tax\n",
-    "\n",
-    "print(f\"Total tax units: {len(baseline_tax):,}\")\n",
-    "print(f\"Weighted tax units (returns): {tax_unit_weight.sum():,.0f}\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 5,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "Results calculated!\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Define income brackets matching the RFA analysis\n",
-    "income_brackets = [\n",
-    "    (float('-inf'), 0, \"$0*\"),\n",
-    "    (0, 10000, \"$1 to $10,000\"),\n",
-    "    (10000, 20000, \"$10,001 to $20,000\"),\n",
-    "    (20000, 30000, \"$20,001 to $30,000\"),\n",
-    "    (30000, 40000, \"$30,001 to $40,000\"),\n",
-    "    (40000, 50000, \"$40,001 to $50,000\"),\n",
-    "    (50000, 75000, \"$50,001 to $75,000\"),\n",
-    "    (75000, 100000, \"$75,001 to $100,000\"),\n",
-    "    (100000, 150000, \"$100,001 to $150,000\"),\n",
-    "    (150000, 200000, \"$150,001 to $200,000\"),\n",
-    "    (200000, 300000, \"$200,001 to $300,000\"),\n",
-    "    (300000, 500000, \"$300,001 to $500,000\"),\n",
-    "    (500000, 1000000, \"$500,001 to $1,000,000\"),\n",
-    "    (1000000, float('inf'), \"Over $1,000,000\")\n",
-    "]\n",
-    "\n",
-    "results = []\n",
-    "\n",
-    "for lower, upper, label in income_brackets:\n",
-    "    if lower == float('-inf'):\n",
-    "        mask = agi <= upper\n",
-    "    elif upper == float('inf'):\n",
-    "        mask = agi > lower\n",
-    "    else:\n",
-    "        mask = (agi > lower) & (agi <= upper)\n",
-    "    \n",
-    "    if mask.sum() == 0:\n",
-    "        continue\n",
-    "    \n",
-    "    # Weighted counts\n",
-    "    est_returns = tax_unit_weight[mask].sum()\n",
-    "    pct_returns = est_returns / tax_unit_weight.sum() * 100\n",
-    "    \n",
-    "    # Tax liability\n",
-    "    old_avg_tax = np.average(baseline_tax[mask], weights=tax_unit_weight[mask]) if est_returns > 0 else 0\n",
-    "    new_avg_tax = np.average(reform_tax[mask], weights=tax_unit_weight[mask]) if est_returns > 0 else 0\n",
-    "    \n",
-    "    # Returns with tax change (threshold of $1)\n",
-    "    change_mask = mask & (np.abs(tax_change) > 1)\n",
-    "    returns_with_change = tax_unit_weight[change_mask].sum()\n",
-    "    pct_with_change = returns_with_change / est_returns * 100 if est_returns > 0 else 0\n",
-    "    \n",
-    "    if returns_with_change > 0:\n",
-    "        old_avg_tax_changed = np.average(baseline_tax[change_mask], weights=tax_unit_weight[change_mask])\n",
-    "        new_avg_tax_changed = np.average(reform_tax[change_mask], weights=tax_unit_weight[change_mask])\n",
-    "        avg_change = new_avg_tax_changed - old_avg_tax_changed\n",
-    "    else:\n",
-    "        old_avg_tax_changed = 0\n",
-    "        new_avg_tax_changed = 0\n",
-    "        avg_change = 0\n",
-    "    \n",
-    "    total_change = (tax_change[mask] * tax_unit_weight[mask]).sum()\n",
-    "    \n",
-    "    # Tax decrease\n",
-    "    decrease_mask = mask & (tax_change < -1)\n",
-    "    decrease_returns = tax_unit_weight[decrease_mask].sum()\n",
-    "    decrease_pct = decrease_returns / est_returns * 100 if est_returns > 0 else 0\n",
-    "    total_decrease = (tax_change[decrease_mask] * tax_unit_weight[decrease_mask]).sum() if decrease_returns > 0 else 0\n",
-    "    avg_decrease = np.average(tax_change[decrease_mask], weights=tax_unit_weight[decrease_mask]) if decrease_returns > 0 else 0\n",
-    "    \n",
-    "    # Tax increase\n",
-    "    increase_mask = mask & (tax_change > 1)\n",
-    "    increase_returns = tax_unit_weight[increase_mask].sum()\n",
-    "    increase_pct = increase_returns / est_returns * 100 if est_returns > 0 else 0\n",
-    "    total_increase = (tax_change[increase_mask] * tax_unit_weight[increase_mask]).sum() if increase_returns > 0 else 0\n",
-    "    avg_increase = np.average(tax_change[increase_mask], weights=tax_unit_weight[increase_mask]) if increase_returns > 0 else 0\n",
-    "    \n",
-    "    # No change\n",
-    "    no_change_mask = mask & (np.abs(tax_change) <= 1)\n",
-    "    no_change_returns = tax_unit_weight[no_change_mask].sum()\n",
-    "    no_change_pct = no_change_returns / est_returns * 100 if est_returns > 0 else 0\n",
-    "    \n",
-    "    # Zero tax liability (under reform)\n",
-    "    zero_tax_mask = mask & (reform_tax <= 0)\n",
-    "    zero_tax_returns = tax_unit_weight[zero_tax_mask].sum()\n",
-    "    zero_tax_pct = zero_tax_returns / est_returns * 100 if est_returns > 0 else 0\n",
-    "    \n",
-    "    results.append({\n",
-    "        \"Federal AGI Range\": label,\n",
-    "        \"Est. # Returns\": int(round(est_returns)),\n",
-    "        \"% of Returns\": round(pct_returns, 1),\n",
-    "        \"Old Avg Tax\": int(round(old_avg_tax)),\n",
-    "        \"New Avg Tax\": int(round(new_avg_tax)),\n",
-    "        \"Returns w/ Change\": int(round(returns_with_change)),\n",
-    "        \"% w/ Change\": round(pct_with_change, 1),\n",
-    "        \"Avg Change\": int(round(avg_change)),\n",
-    "        \"Total Change ($)\": int(round(total_change)),\n",
-    "        \"Decrease #\": int(round(decrease_returns)),\n",
-    "        \"Decrease %\": round(decrease_pct, 1),\n",
-    "        \"Total Decrease ($)\": int(round(total_decrease)),\n",
-    "        \"Avg Decrease\": int(round(avg_decrease)),\n",
-    "        \"Increase #\": int(round(increase_returns)),\n",
-    "        \"Increase %\": round(increase_pct, 1),\n",
-    "        \"Total Increase ($)\": int(round(total_increase)),\n",
-    "        \"Avg Increase\": int(round(avg_increase)),\n",
-    "        \"No Change #\": int(round(no_change_returns)),\n",
-    "        \"No Change %\": round(no_change_pct, 1),\n",
-    "        \"Zero Tax #\": int(round(zero_tax_returns)),\n",
-    "        \"Zero Tax %\": round(zero_tax_pct, 1)\n",
-    "    })\n",
-    "\n",
-    "df_results = pd.DataFrame(results)\n",
-    "print(\"Results calculated!\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 6,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Calculate totals\n",
-    "total_returns = tax_unit_weight.sum()\n",
-    "total_old_tax = np.average(baseline_tax, weights=tax_unit_weight)\n",
-    "total_new_tax = np.average(reform_tax, weights=tax_unit_weight)\n",
-    "\n",
-    "change_mask_all = np.abs(tax_change) > 1\n",
-    "total_returns_changed = tax_unit_weight[change_mask_all].sum()\n",
-    "total_change_amount = (tax_change * tax_unit_weight).sum()\n",
-    "\n",
-    "decrease_mask_all = tax_change < -1\n",
-    "total_decrease_returns = tax_unit_weight[decrease_mask_all].sum()\n",
-    "total_decrease_amount = (tax_change[decrease_mask_all] * tax_unit_weight[decrease_mask_all]).sum()\n",
-    "\n",
-    "increase_mask_all = tax_change > 1\n",
-    "total_increase_returns = tax_unit_weight[increase_mask_all].sum()\n",
-    "total_increase_amount = (tax_change[increase_mask_all] * tax_unit_weight[increase_mask_all]).sum()\n",
-    "\n",
-    "no_change_mask_all = np.abs(tax_change) <= 1\n",
-    "total_no_change_returns = tax_unit_weight[no_change_mask_all].sum()\n",
-    "\n",
-    "zero_tax_mask_all = reform_tax <= 0\n",
-    "total_zero_tax_returns = tax_unit_weight[zero_tax_mask_all].sum()\n",
-    "\n",
-    "# Add totals row\n",
-    "totals = {\n",
-    "    \"Federal AGI Range\": \"Total\",\n",
-    "    \"Est. # Returns\": int(round(total_returns)),\n",
-    "    \"% of Returns\": 100.0,\n",
-    "    \"Old Avg Tax\": int(round(total_old_tax)),\n",
-    "    \"New Avg Tax\": int(round(total_new_tax)),\n",
-    "    \"Returns w/ Change\": int(round(total_returns_changed)),\n",
-    "    \"% w/ Change\": round(total_returns_changed / total_returns * 100, 1),\n",
-    "    \"Avg Change\": int(round(total_new_tax - total_old_tax)),\n",
-    "    \"Total Change ($)\": int(round(total_change_amount)),\n",
-    "    \"Decrease #\": int(round(total_decrease_returns)),\n",
-    "    \"Decrease %\": round(total_decrease_returns / total_returns * 100, 1),\n",
-    "    \"Total Decrease ($)\": int(round(total_decrease_amount)),\n",
-    "    \"Avg Decrease\": int(round(total_decrease_amount / total_decrease_returns)) if total_decrease_returns > 0 else 0,\n",
-    "    \"Increase #\": int(round(total_increase_returns)),\n",
-    "    \"Increase %\": round(total_increase_returns / total_returns * 100, 1),\n",
-    "    \"Total Increase ($)\": int(round(total_increase_amount)),\n",
-    "    \"Avg Increase\": int(round(total_increase_amount / total_increase_returns)) if total_increase_returns > 0 else 0,\n",
-    "    \"No Change #\": int(round(total_no_change_returns)),\n",
-    "    \"No Change %\": round(total_no_change_returns / total_returns * 100, 1),\n",
-    "    \"Zero Tax #\": int(round(total_zero_tax_returns)),\n",
-    "    \"Zero Tax %\": round(total_zero_tax_returns / total_returns * 100, 1)\n",
-    "}\n",
-    "\n",
-    "df_results = pd.concat([df_results, pd.DataFrame([totals])], ignore_index=True)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "## Results Summary"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 7,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "====================================================================================================\n",
-      "H. 4216 - ESTIMATED SOUTH CAROLINA INDIVIDUAL INCOME TAX IMPACT\n",
-      "Tax Year 2026\n",
-      "====================================================================================================\n",
-      "\n",
-      "Proposal: Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over,\n",
-      "eliminate the federal standard or itemized deduction, allow a new SC deduction at\n",
-      "certain income levels, and maintain all other state adjustments, exemptions, and credits.\n",
-      "====================================================================================================\n",
-      "\n",
-      "Impact: With this tax structure:\n",
-      "  - 33.1% of taxpayers have a LOWER tax liability\n",
-      "  - 25.1% of taxpayers have a HIGHER tax liability\n",
-      "  - 41.8% are UNCHANGED\n",
-      "\n",
-      "General Fund Impact: $-14,654,645,248\n",
-      "====================================================================================================\n"
-     ]
-    }
-   ],
-   "source": [
-    "print(\"=\"*100)\n",
-    "print(\"H. 4216 - ESTIMATED SOUTH CAROLINA INDIVIDUAL INCOME TAX IMPACT\")\n",
-    "print(f\"Tax Year {TAX_YEAR}\")\n",
-    "print(\"=\"*100)\n",
-    "print(f\"\\nProposal: Apply a tax rate of 1.99% on taxable income up to $30,000 and 5.39% over,\")\n",
-    "print(f\"eliminate the federal standard or itemized deduction, allow a new SC deduction at\")\n",
-    "print(f\"certain income levels, and maintain all other state adjustments, exemptions, and credits.\")\n",
-    "print(\"=\"*100)\n",
-    "\n",
-    "# Summary stats\n",
-    "pct_decrease = total_decrease_returns / total_returns * 100\n",
-    "pct_increase = total_increase_returns / total_returns * 100\n",
-    "pct_unchanged = total_no_change_returns / total_returns * 100\n",
-    "\n",
-    "print(f\"\\nImpact: With this tax structure:\")\n",
-    "print(f\"  - {pct_decrease:.1f}% of taxpayers have a LOWER tax liability\")\n",
-    "print(f\"  - {pct_increase:.1f}% of taxpayers have a HIGHER tax liability\")\n",
-    "print(f\"  - {pct_unchanged:.1f}% are UNCHANGED\")\n",
-    "print(f\"\\nGeneral Fund Impact: ${total_change_amount:,.0f}\")\n",
-    "print(\"=\"*100)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 8,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "     Federal AGI Range  Est. # Returns  % of Returns  Old Avg Tax  New Avg Tax  Total Change ($)  Decrease #  Decrease %  Increase #  Increase %  No Change %  Zero Tax %\n",
-      "                   $0*          369521          11.5            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
-      "         $1 to $10,000          406965          12.7            0            0                 0           0    0.000000           0    0.000000   100.000000  100.000000\n",
-      "    $10,001 to $20,000          295746           9.2            0           11           3145121           0    0.000000       64066   21.700001    78.300003   78.199997\n",
-      "    $20,001 to $30,000          278678           8.7           67           96           8096652        9396    3.400000      127046   45.599998    51.000000   50.799999\n",
-      "    $30,001 to $40,000          252815           7.9          289          243         -11809976      135818   53.700001       39744   15.700000    30.600000   30.200001\n",
-      "    $40,001 to $50,000          204601           6.4          632          459         -35389328      118222   57.799999       47018   23.000000    19.200001   19.200001\n",
-      "    $50,001 to $75,000          407221          12.7         1214         1073         -57309672      273530   67.199997       78571   19.299999    13.500000   13.500000\n",
-      "   $75,001 to $100,000          253742           7.9         2078         2056          -5720177      149558   58.900002       90703   35.700001     5.300000    4.900000\n",
-      "  $100,001 to $150,000          310561           9.7         3694         3875          56132876      147042   47.299999      160837   51.799999     0.900000    0.500000\n",
-      "  $150,001 to $200,000          145460           4.5         6365         6796          62730072       31526   21.700001      113934   78.300003     0.000000    0.000000\n",
-      "  $200,001 to $300,000          100241           3.1         9594        10054          46091116       38119   38.000000       60974   60.799999     1.100000    1.100000\n",
-      "  $300,001 to $500,000          103531           3.2        16932        16233         -72464000       91344   88.199997       11782   11.400000     0.400000    0.400000\n",
-      "$500,001 to $1,000,000           19045           0.6        27051        25511         -29327746       16469   86.500000        2249   11.800000     1.700000    1.700000\n",
-      "       Over $1,000,000           56592           1.8      4277978      4019660      -14618820608       49508   87.500000        7084   12.500000     0.000000    0.000000\n",
-      "                 Total         3204719         100.0        77588        73015      -14654645248     1060532   33.099998      804008   25.100000    41.799999   41.700001\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Display main results table\n",
-    "display_cols = [\n",
-    "    \"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \n",
-    "    \"Old Avg Tax\", \"New Avg Tax\", \"Total Change ($)\",\n",
-    "    \"Decrease #\", \"Decrease %\", \"Increase #\", \"Increase %\",\n",
-    "    \"No Change %\", \"Zero Tax %\"\n",
-    "]\n",
-    "\n",
-    "# Convert numpy types to native Python types to avoid display issues\n",
-    "df_display = df_results[display_cols].copy()\n",
-    "for col in df_display.columns:\n",
-    "    if df_display[col].dtype in ['float32', 'float64']:\n",
-    "        df_display[col] = df_display[col].astype(float)\n",
-    "    elif df_display[col].dtype in ['int32', 'int64']:\n",
-    "        df_display[col] = df_display[col].astype(int)\n",
-    "\n",
-    "pd.set_option('display.max_columns', None)\n",
-    "pd.set_option('display.width', None)\n",
-    "\n",
-    "print(df_display.to_string(index=False))"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 9,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Full results exported to: sc_h4216_tax_impact_analysis.csv\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Export full results\n",
-    "df_results.to_csv('sc_h4216_tax_impact_analysis.csv', index=False)\n",
-    "print(\"\\nFull results exported to: sc_h4216_tax_impact_analysis.csv\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "## Detailed Breakdown Tables"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 10,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "================================================================================\n",
-      "ESTIMATED TAX RETURN DISTRIBUTION\n",
-      "================================================================================\n",
-      "     Federal AGI Range  Est. # Returns  % of Returns  Old Avg Tax  New Avg Tax\n",
-      "                   $0*          369521          11.5            0            0\n",
-      "         $1 to $10,000          406965          12.7            0            0\n",
-      "    $10,001 to $20,000          295746           9.2            0           11\n",
-      "    $20,001 to $30,000          278678           8.7           67           96\n",
-      "    $30,001 to $40,000          252815           7.9          289          243\n",
-      "    $40,001 to $50,000          204601           6.4          632          459\n",
-      "    $50,001 to $75,000          407221          12.7         1214         1073\n",
-      "   $75,001 to $100,000          253742           7.9         2078         2056\n",
-      "  $100,001 to $150,000          310561           9.7         3694         3875\n",
-      "  $150,001 to $200,000          145460           4.5         6365         6796\n",
-      "  $200,001 to $300,000          100241           3.1         9594        10054\n",
-      "  $300,001 to $500,000          103531           3.2        16932        16233\n",
-      "$500,001 to $1,000,000           19045           0.6        27051        25511\n",
-      "       Over $1,000,000           56592           1.8      4277978      4019660\n",
-      "                 Total         3204719         100.0        77588        73015\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Tax Return Distribution\n",
-    "print(\"\\n\" + \"=\"*80)\n",
-    "print(\"ESTIMATED TAX RETURN DISTRIBUTION\")\n",
-    "print(\"=\"*80)\n",
-    "dist_cols = [\"Federal AGI Range\", \"Est. # Returns\", \"% of Returns\", \"Old Avg Tax\", \"New Avg Tax\"]\n",
-    "print(df_results[dist_cols].to_string(index=False))"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 11,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "================================================================================\n",
-      "TAX RETURNS WITH A DECREASE IN LIABILITY\n",
-      "================================================================================\n",
-      "     Federal AGI Range  Decrease #  Decrease %  Total Decrease ($)  Avg Decrease\n",
-      "                   $0*           0    0.000000                   0             0\n",
-      "         $1 to $10,000           0    0.000000                   0             0\n",
-      "    $10,001 to $20,000           0    0.000000                   0             0\n",
-      "    $20,001 to $30,000        9396    3.400000              -50358            -5\n",
-      "    $30,001 to $40,000      135818   53.700001           -14845139          -109\n",
-      "    $40,001 to $50,000      118222   57.799999           -39889976          -337\n",
-      "    $50,001 to $75,000      273530   67.199997           -73336032          -268\n",
-      "   $75,001 to $100,000      149558   58.900002           -36993168          -247\n",
-      "  $100,001 to $150,000      147042   47.299999           -22048396          -150\n",
-      "  $150,001 to $200,000       31526   21.700001           -11001782          -349\n",
-      "  $200,001 to $300,000       38119   38.000000           -21143300          -555\n",
-      "  $300,001 to $500,000       91344   88.199997           -93526784         -1024\n",
-      "$500,001 to $1,000,000       16469   86.500000           -35028512         -2127\n",
-      "       Over $1,000,000       49508   87.500000        -17806082048       -359664\n",
-      "                 Total     1060532   33.099998        -18153947136        -17118\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Tax Decrease Summary\n",
-    "print(\"\\n\" + \"=\"*80)\n",
-    "print(\"TAX RETURNS WITH A DECREASE IN LIABILITY\")\n",
-    "print(\"=\"*80)\n",
-    "decrease_cols = [\"Federal AGI Range\", \"Decrease #\", \"Decrease %\", \"Total Decrease ($)\", \"Avg Decrease\"]\n",
-    "print(df_results[decrease_cols].to_string(index=False))"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 12,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "================================================================================\n",
-      "TAX RETURNS WITH AN INCREASE IN LIABILITY\n",
-      "================================================================================\n",
-      "     Federal AGI Range  Increase #  Increase %  Total Increase ($)  Avg Increase\n",
-      "                   $0*           0    0.000000                   0             0\n",
-      "         $1 to $10,000           0    0.000000                   0             0\n",
-      "    $10,001 to $20,000       64066   21.700001             3144930            49\n",
-      "    $20,001 to $30,000      127046   45.599998             8146672            64\n",
-      "    $30,001 to $40,000       39744   15.700000             3035304            76\n",
-      "    $40,001 to $50,000       47018   23.000000             4500647            96\n",
-      "    $50,001 to $75,000       78571   19.299999            16026354           204\n",
-      "   $75,001 to $100,000       90703   35.700001            31273924           345\n",
-      "  $100,001 to $150,000      160837   51.799999            78180864           486\n",
-      "  $150,001 to $200,000      113934   78.300003            73731856           647\n",
-      "  $200,001 to $300,000       60974   60.799999            67234448          1103\n",
-      "  $300,001 to $500,000       11782   11.400000            21062782          1788\n",
-      "$500,001 to $1,000,000        2249   11.800000             5700766          2534\n",
-      "       Over $1,000,000        7084   12.500000          3187261952        449920\n",
-      "                 Total      804008   25.100000          3499300352          4352\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Tax Increase Summary\n",
-    "print(\"\\n\" + \"=\"*80)\n",
-    "print(\"TAX RETURNS WITH AN INCREASE IN LIABILITY\")\n",
-    "print(\"=\"*80)\n",
-    "increase_cols = [\"Federal AGI Range\", \"Increase #\", \"Increase %\", \"Total Increase ($)\", \"Avg Increase\"]\n",
-    "print(df_results[increase_cols].to_string(index=False))"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 13,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "================================================================================\n",
-      "TAX RETURNS WITH NO CHANGE / ZERO TAX LIABILITY\n",
-      "================================================================================\n",
-      "     Federal AGI Range  No Change #  No Change %  Zero Tax #  Zero Tax %\n",
-      "                   $0*       369521   100.000000      369521  100.000000\n",
-      "         $1 to $10,000       406965   100.000000      406965  100.000000\n",
-      "    $10,001 to $20,000       231681    78.300003      231347   78.199997\n",
-      "    $20,001 to $30,000       142236    51.000000      141555   50.799999\n",
-      "    $30,001 to $40,000        77253    30.600000       76459   30.200001\n",
-      "    $40,001 to $50,000        39362    19.200001       39362   19.200001\n",
-      "    $50,001 to $75,000        55120    13.500000       55120   13.500000\n",
-      "   $75,001 to $100,000        13480     5.300000       12472    4.900000\n",
-      "  $100,001 to $150,000         2682     0.900000        1604    0.500000\n",
-      "  $150,001 to $200,000            0     0.000000           0    0.000000\n",
-      "  $200,001 to $300,000         1147     1.100000        1069    1.100000\n",
-      "  $300,001 to $500,000          405     0.400000         405    0.400000\n",
-      "$500,001 to $1,000,000          326     1.700000         326    1.700000\n",
-      "       Over $1,000,000            1     0.000000           1    0.000000\n",
-      "                 Total      1340179    41.799999     1336206   41.700001\n"
-     ]
-    }
-   ],
-   "source": [
-    "# No Change and Zero Tax\n",
-    "print(\"\\n\" + \"=\"*80)\n",
-    "print(\"TAX RETURNS WITH NO CHANGE / ZERO TAX LIABILITY\")\n",
-    "print(\"=\"*80)\n",
-    "other_cols = [\"Federal AGI Range\", \"No Change #\", \"No Change %\", \"Zero Tax #\", \"Zero Tax %\"]\n",
-    "print(df_results[other_cols].to_string(index=False))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "## Comparison to RFA Fiscal Note\n",
-    "\n",
-    "The SC Revenue & Fiscal Affairs (RFA) Office estimated H.4216 would have a **-$119.1M** General Fund impact.\n",
-    "\n",
-    "Key differences between PolicyEngine and RFA estimates:\n",
-    "- **Population**: PE counts all tax units (filers + non-filers); RFA counts only actual filers\n",
-    "- **Data source**: PE uses CPS-based synthetic data; RFA uses actual SC tax return data\n",
-    "- **Income distribution**: PE has different return counts by income bracket, particularly more millionaires"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 14,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "================================================================================\n",
-      "COMPARISON: PolicyEngine vs RFA Fiscal Note\n",
-      "================================================================================\n",
-      "\n",
-      "General Fund Impact:\n",
-      "  RFA Estimate:          $   -238,151,000\n",
-      "  PolicyEngine Estimate: $-14,654,645,248\n",
-      "  Difference:            $-14,416,494,248\n",
-      "\n",
-      "  Accuracy vs RFA: -5953.5%\n",
-      "\n",
-      "Total Returns:\n",
-      "  RFA:             5,515,148\n",
-      "  PolicyEngine:    3,204,719\n",
-      "  Difference:     -2,310,428\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Load RFA analysis for comparison\n",
-    "rfa_df = pd.read_csv('rfa_h4216_analysis.csv')\n",
-    "\n",
-    "print(\"=\"*80)\n",
-    "print(\"COMPARISON: PolicyEngine vs RFA Fiscal Note\")\n",
-    "print(\"=\"*80)\n",
-    "\n",
-    "# RFA total impact - parse the dollar string to number\n",
-    "def parse_dollar(val):\n",
-    "    if isinstance(val, str):\n",
-    "        return float(val.replace('$', '').replace(',', '').replace('-', '-'))\n",
-    "    return val\n",
-    "\n",
-    "rfa_df['Total Dollar Change Numeric'] = rfa_df['Total Dollar Change'].apply(parse_dollar)\n",
-    "rfa_total_impact = rfa_df['Total Dollar Change Numeric'].sum()\n",
-    "pe_total_impact = total_change_amount\n",
-    "\n",
-    "print(f\"\\nGeneral Fund Impact:\")\n",
-    "print(f\"  RFA Estimate:          ${rfa_total_impact:>15,.0f}\")\n",
-    "print(f\"  PolicyEngine Estimate: ${pe_total_impact:>15,.0f}\")\n",
-    "print(f\"  Difference:            ${pe_total_impact - rfa_total_impact:>15,.0f}\")\n",
-    "\n",
-    "# Calculate accuracy\n",
-    "accuracy = 1 - abs(pe_total_impact - rfa_total_impact) / abs(rfa_total_impact)\n",
-    "print(f\"\\n  Accuracy vs RFA: {accuracy*100:.1f}%\")\n",
-    "\n",
-    "# Return count comparison\n",
-    "rfa_total_returns = rfa_df['Est # Returns'].sum()\n",
-    "print(f\"\\nTotal Returns:\")\n",
-    "print(f\"  RFA:          {rfa_total_returns:>12,.0f}\")\n",
-    "print(f\"  PolicyEngine: {int(total_returns):>12,.0f}\")\n",
-    "print(f\"  Difference:   {int(total_returns - rfa_total_returns):>+12,.0f}\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 15,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "================================================================================\n",
-      "IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\n",
-      "================================================================================\n",
-      "             AGI Range  PE Returns  RFA Returns    PE Impact  RFA Impact      Diff ($)\n",
-      "                   $0*      369521        78854            0   -571000.0  5.710000e+05\n",
-      "         $1 to $10,000      406965            0            0         0.0  0.000000e+00\n",
-      "    $10,001 to $20,000      295746            0      3145121         0.0  3.145121e+06\n",
-      "    $20,001 to $30,000      278678            0      8096652         0.0  8.096652e+06\n",
-      "    $30,001 to $40,000      252815            0    -11809976         0.0 -1.180998e+07\n",
-      "    $40,001 to $50,000      204601            0    -35389328         0.0 -3.538933e+07\n",
-      "    $50,001 to $75,000      407221            0    -57309672         0.0 -5.730967e+07\n",
-      "   $75,001 to $100,000      253742            0     -5720177         0.0 -5.720177e+06\n",
-      "  $100,001 to $150,000      310561            0     56132876         0.0  5.613288e+07\n",
-      "  $150,001 to $200,000      145460            0     62730072         0.0  6.273007e+07\n",
-      "  $200,001 to $300,000      100241            0     46091116         0.0  4.609112e+07\n",
-      "  $300,001 to $500,000      103531            0    -72464000         0.0 -7.246400e+07\n",
-      "$500,001 to $1,000,000       19045            0    -29327746         0.0 -2.932775e+07\n",
-      "       Over $1,000,000       56592            0 -14618820608         0.0 -1.461882e+10\n"
-     ]
-    }
-   ],
-   "source": [
-    "# Side-by-side comparison by income bracket\n",
-    "print(\"\\n\" + \"=\"*80)\n",
-    "print(\"IMPACT BY INCOME BRACKET: PolicyEngine vs RFA\")\n",
-    "print(\"=\"*80)\n",
-    "\n",
-    "# Map PE brackets to RFA brackets for comparison\n",
-    "bracket_comparison = []\n",
-    "for idx, row in df_results.iterrows():\n",
-    "    if row['Federal AGI Range'] == 'Total':\n",
-    "        continue\n",
-    "    \n",
-    "    # Find matching RFA row\n",
-    "    rfa_match = rfa_df[rfa_df['Federal AGI Range'] == row['Federal AGI Range']]\n",
-    "    if len(rfa_match) > 0:\n",
-    "        rfa_impact = rfa_match['Total Dollar Change Numeric'].values[0]\n",
-    "        rfa_returns = rfa_match['Est # Returns'].values[0]\n",
-    "    else:\n",
-    "        rfa_impact = 0\n",
-    "        rfa_returns = 0\n",
-    "    \n",
-    "    bracket_comparison.append({\n",
-    "        'AGI Range': row['Federal AGI Range'],\n",
-    "        'PE Returns': row['Est. # Returns'],\n",
-    "        'RFA Returns': rfa_returns,\n",
-    "        'PE Impact': row['Total Change ($)'],\n",
-    "        'RFA Impact': rfa_impact,\n",
-    "        'Diff ($)': row['Total Change ($)'] - rfa_impact\n",
-    "    })\n",
-    "\n",
-    "comparison_df = pd.DataFrame(bracket_comparison)\n",
-    "print(comparison_df.to_string(index=False))"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.5"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 4
-}
\ No newline at end of file
diff --git a/us/states/sc/sc_h4216_tax_impact_analysis.csv b/us/states/sc/sc_h4216_tax_impact_analysis.csv
deleted file mode 100644
index ba8d6d7..0000000
--- a/us/states/sc/sc_h4216_tax_impact_analysis.csv
+++ /dev/null
@@ -1,16 +0,0 @@
-Federal AGI Range,Est. # Returns,% of Returns,Old Avg Tax,New Avg Tax,Returns w/ Change,% w/ Change,Avg Change,Total Change ($),Decrease #,Decrease %,Total Decrease ($),Avg Decrease,Increase #,Increase %,Total Increase ($),Avg Increase,No Change #,No Change %,Zero Tax #,Zero Tax %
-$0*,369521,11.5,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,369521,100.0,369521,100.0
-"$1 to $10,000",406965,12.699999809265137,0,0,0,0.0,0,0,0,0.0,0,0,0,0.0,0,0,406965,100.0,406965,100.0
-"$10,001 to $20,000",295746,9.199999809265137,0,11,64066,21.7,49,3145121,0,0.0,0,0,64066,21.7,3144930,49,231681,78.3,231347,78.2
-"$20,001 to $30,000",278678,8.699999809265137,67,96,136442,49.0,59,8096652,9396,3.4,-50358,-5,127046,45.6,8146672,64,142236,51.0,141555,50.8
-"$30,001 to $40,000",252815,7.900000095367432,289,243,175562,69.4,-67,-11809976,135818,53.7,-14845139,-109,39744,15.7,3035304,76,77253,30.6,76459,30.2
-"$40,001 to $50,000",204601,6.400000095367432,632,459,165240,80.8,-214,-35389328,118222,57.8,-39889976,-337,47018,23.0,4500647,96,39362,19.2,39362,19.2
-"$50,001 to $75,000",407221,12.699999809265137,1214,1073,352101,86.5,-163,-57309672,273530,67.2,-73336032,-268,78571,19.3,16026354,204,55120,13.5,55120,13.5
-"$75,001 to $100,000",253742,7.900000095367432,2078,2056,240262,94.7,-24,-5720177,149558,58.9,-36993168,-247,90703,35.7,31273924,345,13480,5.3,12472,4.9
-"$100,001 to $150,000",310561,9.699999809265137,3694,3875,307879,99.1,182,56132876,147042,47.3,-22048396,-150,160837,51.8,78180864,486,2682,0.9,1604,0.5
-"$150,001 to $200,000",145460,4.5,6365,6796,145460,100.0,431,62730072,31526,21.7,-11001782,-349,113934,78.3,73731856,647,0,0.0,0,0.0
-"$200,001 to $300,000",100241,3.0999999046325684,9594,10054,99094,98.9,465,46091116,38119,38.0,-21143300,-555,60974,60.8,67234448,1103,1147,1.1,1069,1.1
-"$300,001 to $500,000",103531,3.200000047683716,16932,16233,103126,99.6,-703,-72464000,91344,88.2,-93526784,-1024,11782,11.4,21062782,1788,405,0.4,405,0.4
-"$500,001 to $1,000,000",19045,0.6000000238418579,27051,25511,18718,98.3,-1567,-29327746,16469,86.5,-35028512,-2127,2249,11.8,5700766,2534,326,1.7,326,1.7
-"Over $1,000,000",56592,1.7999999523162842,4277978,4019660,56592,100.0,-258322,-14618820608,49508,87.5,-17806082048,-359664,7084,12.5,3187261952,449920,1,0.0,1,0.0
-Total,3204719,100.0,77588,73015,1864540,58.2,-4573,-14654645248,1060532,33.1,-18153947136,-17118,804008,25.1,3499300352,4352,1340179,41.8,1336206,41.7