anth-volk committed on
Commit
743c45d
·
verified ·
1 Parent(s): 22d4ccf

Upload test/target_config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. test/target_config.yaml +119 -0
test/target_config.yaml ADDED
@@ -0,0 +1,119 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ include:
3
+ # === DISTRICT — age demographics ===
4
+ - variable: person_count
5
+ geo_level: district
6
+ domain_variable: age
7
+
8
+ # === DISTRICT — count targets ===
9
+ # REMOVED: person_count by AGI — filer-gated, all AGI bins 100% underestimated
10
+ - variable: household_count
11
+ geo_level: district
12
+
13
+ # === DISTRICT — dollar targets (all <8% mean error, restored) ===
14
+ - variable: real_estate_taxes
15
+ geo_level: district
16
+ - variable: self_employment_income
17
+ geo_level: district
18
+ - variable: taxable_pension_income
19
+ geo_level: district
20
+ - variable: refundable_ctc
21
+ geo_level: district
22
+ - variable: unemployment_compensation
23
+ geo_level: district
24
+
25
+ # === DISTRICT — ACA PTC (2% mean error, restored) ===
26
+ - variable: aca_ptc
27
+ geo_level: district
28
+ - variable: tax_unit_count
29
+ geo_level: district
30
+ domain_variable: aca_ptc
31
+
32
+ # === STATE ===
33
+ - variable: person_count
34
+ geo_level: state
35
+ domain_variable: medicaid_enrolled
36
+ # REMOVED: is_pregnant — 100% unachievable across all 51 state geos
37
+ - variable: snap
38
+ geo_level: state
39
+
40
+ # === NATIONAL — aggregate dollar targets ===
41
+ # REMOVED: adjusted_gross_income — filer-gated
42
+ - variable: child_support_expense
43
+ geo_level: national
44
+ - variable: child_support_received
45
+ geo_level: national
46
+ # REMOVED: eitc — filer-gated
47
+ - variable: health_insurance_premiums_without_medicare_part_b
48
+ geo_level: national
49
+ - variable: medicaid
50
+ geo_level: national
51
+ - variable: medicare_part_b_premiums
52
+ geo_level: national
53
+ - variable: other_medical_expenses
54
+ geo_level: national
55
+ - variable: over_the_counter_health_expenses
56
+ geo_level: national
57
+ # REMOVED: qualified_business_income_deduction — filer-gated
58
+ - variable: rent
59
+ geo_level: national
60
+ # REMOVED: salt_deduction — 11.3x overestimate, worst variable in model
61
+ - variable: snap
62
+ geo_level: national
63
+ - variable: social_security
64
+ geo_level: national
65
+ - variable: social_security_disability
66
+ geo_level: national
67
+ - variable: social_security_retirement
68
+ geo_level: national
69
+ - variable: spm_unit_capped_housing_subsidy
70
+ geo_level: national
71
+ - variable: spm_unit_capped_work_childcare_expenses
72
+ geo_level: national
73
+ - variable: ssi
74
+ geo_level: national
75
+ - variable: tanf
76
+ geo_level: national
77
+ # REMOVED: tip_income — filer-gated
78
+ - variable: unemployment_compensation
79
+ geo_level: national
80
+
81
+ # === NATIONAL — IRS SOI domain-constrained dollar targets (restored: |rel_err| < 15%) ===
82
+ - variable: aca_ptc
83
+ geo_level: national
84
+ domain_variable: aca_ptc
85
+ - variable: net_capital_gains
86
+ geo_level: national
87
+ domain_variable: net_capital_gains
88
+ - variable: refundable_ctc
89
+ geo_level: national
90
+ domain_variable: refundable_ctc
91
+ - variable: self_employment_income
92
+ geo_level: national
93
+ domain_variable: self_employment_income
94
+ - variable: tax_unit_partnership_s_corp_income
95
+ geo_level: national
96
+ domain_variable: tax_unit_partnership_s_corp_income
97
+ - variable: taxable_pension_income
98
+ geo_level: national
99
+ domain_variable: taxable_pension_income
100
+ - variable: unemployment_compensation
101
+ geo_level: national
102
+ domain_variable: unemployment_compensation
103
+ # REMOVED (|rel_err| > 15% or tension with counts):
104
+ # adjusted_gross_income (28%), dividend_income (26%, tension), eitc (23%),
105
+ # eitc by child_count (14-77%, tension), income_tax_before_credits (21%),
106
+ # income_tax_positive (22%), qualified_business_income_deduction (55-63%),
107
+ # qualified_dividend_income (29%, tension), rental_income (20%),
108
+ # salt (102%), salt_deduction (1130%), tax_exempt_interest_income (61%),
109
+ # taxable_interest_income (61%), taxable_ira_distributions (68%),
110
+ # taxable_social_security (55%)
111
+
112
+ # === NATIONAL — IRS SOI filer count targets (restored: |rel_err| < 10%) ===
113
+ - variable: tax_unit_count
114
+ geo_level: national
115
+ domain_variable: aca_ptc
116
+ - variable: tax_unit_count
117
+ geo_level: national
118
+ domain_variable: refundable_ctc
119
+ # REMOVED (|rel_err| > 10%): all other filer count targets (22-706% error)