Skip to content

Commit

Permalink
Remove old code that was commented out
Browse files Browse the repository at this point in the history
  • Loading branch information
martinholmer committed Aug 22, 2024
1 parent 85a0c74 commit 298ad99
Showing 1 changed file with 9 additions and 140 deletions.
149 changes: 9 additions & 140 deletions tax_microdata_benchmarking/datasets/taxcalc_dataset.py
Original file line number Diff line number Diff line change
Expand Up @@ -152,177 +152,46 @@ def pe(variable):
+ pe("estate_income")
+ pe("farm_rent_income")
)

df = pd.DataFrame(var)

"""
df = pd.DataFrame()
df["E03500"] = pe("alimony_expense")
df["E00800"] = pe("alimony_income")
df["G20500"] = pe(
"casualty_loss"
) # Amend with taxdata treatment from e20500
df["E32800"] = pe("cdcc_relevant_expenses")
df["E19800"] = pe("charitable_cash_donations")
df["E20100"] = pe("charitable_non_cash_donations")
df["XTOT"] = pe("exemptions_count")
df["E03240"] = pe("domestic_production_ald")
df["E03400"] = pe("early_withdrawal_penalty")
df["E03220"] = pe("educator_expense")
df["E00200"] = pe("employment_income")
df["E02100"] = pe("farm_income")
df["E27200"] = pe("farm_rent_income")
df["E03290"] = pe("health_savings_account_ald")
df["E19200"] = pe("interest_deduction")
df["P23250"] = pe("long_term_capital_gains")
df["E24518"] = pe("long_term_capital_gains_on_collectibles")
df["E17500"] = pe("medical_expense")
df["E00600"] = pe("non_qualified_dividend_income") + pe(
"qualified_dividend_income"
)
df["E00650"] = pe("qualified_dividend_income")
df["E26270"] = pe("partnership_s_corp_income")
df["E03230"] = pe("qualified_tuition_expenses")
df["E18500"] = pe("real_estate_taxes")
df["E00900"] = pe("self_employment_income")
df["E03270"] = pe("self_employed_health_insurance_ald")
df["E03300"] = pe("self_employed_pension_contribution_ald")
df["P22250"] = pe("short_term_capital_gains")
df["E02400"] = pe("social_security")
df["E18400"] = pe("state_and_local_sales_or_income_tax")
df["E03210"] = pe("student_loan_interest")
df["E00300"] = pe("taxable_interest_income")
df["E01700"] = pe("taxable_pension_income")
df["E02300"] = pe("taxable_unemployment_compensation")
df["E01400"] = pe("taxable_ira_distributions")
df["E00400"] = pe("tax_exempt_interest_income")
df["E01500"] = pe("tax_exempt_pension_income") + pe(
"taxable_pension_income"
)
df["E01700"] = pe("taxable_pension_income")
df["E03150"] = pe("traditional_ira_contributions")
df["E24515"] = pe("unrecaptured_section_1250_gain")
df["E27200"] = pe("farm_rent_income")
df["MARS"] = (
pd.Series(pe("filing_status"))
.map(
{
"SINGLE": 1,
"JOINT": 2,
"SEPARATE": 3,
"HEAD_OF_HOUSEHOLD": 4,
"SURVIVING_SPOUSE": 5,
}
)
.values
)
df["RECID"] = pe("household_id")
df["S006"] = pe("tax_unit_weight")
df["a_lineno"] = 0 # TD-specific (CPS matched person ID)
df["agi_bin"] = 0 # TD-specific (AGI bin)
df["h_seq"] = 0 # TD-specific (CPS matched household ID)
df["ffpos"] = 0 # TD-specific (CPS matched family ID)
df["fips"] = 0 # No FIPS data
df["DSI"] = 0 # Claimed as dependent on another return, assume not
df["EIC"] = np.minimum(pe("eitc_child_count"), 3)
df["FLPDYR"] = year
df["MIDR"] = 0 # Separately filing spouse itemizes, assume not
df["PT_SSTB_income"] = (
0 # Business income is from specified service trade assume not
)
df["tanf_ben"] = 0 # TANF benefits, assume none
df["vet_ben"] = 0 # Veteran's benefits, assume none
df["wic_ben"] = 0 # WIC benefits, assume none
df["snap_ben"] = 0 # SNAP benefits, assume none
df["housing_ben"] = 0 # Housing benefits, assume none
df["ssi_ben"] = 0 # SSI benefits, assume none
df["mcare_ben"] = 0 # Medicare benefits, assume none
df["mcaid_ben"] = 0 # Medicaid benefits, assume none
df["other_ben"] = 0 # Other benefits, assume none
df["PT_binc_w2_wages"] = pe("w2_wages_from_qualified_business")
df["PT_ubia_property"] = 0
df["data_source"] = 1 if "puf" in pe_dataset.__name__.lower() else 0
df["e02000"] = (
pe("rental_income")
+ pe("partnership_s_corp_income")
+ pe("estate_income")
+ pe("farm_rent_income")
)
df["e20400"] = pe("misc_deduction")
df["e07300"] = pe("foreign_tax_credit")
df["e62900"] = pe("amt_foreign_tax_credit")
df["e01200"] = pe("miscellaneous_income")
df["e00700"] = pe("salt_refund_income")
df["e58990"] = pe("investment_income_elected_form_4952")
df["e07400"] = pe("general_business_credit")
df["e07600"] = pe("prior_year_minimum_tax_credit")
df["e11200"] = pe("excess_withheld_payroll_tax")
df["e01100"] = pe("non_sch_d_capital_gains")
df["e87521"] = pe("american_opportunity_credit")
df["e07260"] = pe("energy_efficient_home_improvement_credit")
df["e09900"] = pe("early_withdrawal_penalty")
df["p08000"] = pe("other_credits")
df["e07240"] = pe("savers_credit")
df["e09700"] = pe("recapture_of_investment_credit")
df["e09800"] = pe("unreported_payroll_tax")
df["f2441"] = pe("count_cdcc_eligible")
df["e87530"] = df[
"E03230"
] # Assume same definition for tuition expenses (for now).
df["cmbtp"] = 0
df["f6251"] = 0
df["k1bx14p"] = 0
df["k1bx14s"] = 0
"""

# head and spouse pairs

map_to_tax_unit = lambda arr: pe_sim.map_result(arr, "person", "tax_unit")

filer = pe_sim.calculate("is_tax_unit_head").values
# specify df head/spouse variables
head = pe_sim.calculate("is_tax_unit_head").values
spouse = pe_sim.calculate("is_tax_unit_spouse").values

employment_income = pe_sim.calculate("employment_income").values
self_employment_income = pe_sim.calculate("self_employment_income").values
farm_income = pe_sim.calculate("farm_income").values
pre_tax_contributions = pe_sim.calculate("pre_tax_contributions").values

df["e00200p"] = map_to_tax_unit(employment_income * filer)
df["e00200p"] = map_to_tax_unit(employment_income * head)
df["e00200s"] = map_to_tax_unit(employment_income * spouse)
df["e00900p"] = map_to_tax_unit(self_employment_income * filer)
df["e00900p"] = map_to_tax_unit(self_employment_income * head)
df["e00900s"] = map_to_tax_unit(self_employment_income * spouse)
df["e02100p"] = map_to_tax_unit(farm_income * filer)
df["e02100p"] = map_to_tax_unit(farm_income * head)
df["e02100s"] = map_to_tax_unit(farm_income * spouse)
df["pencon_p"] = map_to_tax_unit(pre_tax_contributions * filer)
df["pencon_p"] = map_to_tax_unit(pre_tax_contributions * head)
df["pencon_s"] = map_to_tax_unit(pre_tax_contributions * spouse)

# Demographics

# specify df demographics
age = pe_sim.calculate("age").values
head = pe_sim.calculate("is_tax_unit_head").values
spouse = pe_sim.calculate("is_tax_unit_spouse").values
dependent = pe_sim.calculate("is_tax_unit_dependent").values
blind = pe_sim.calculate("is_blind").values

df["age_head"] = map_to_tax_unit(age * head)
df["age_spouse"] = map_to_tax_unit(age * spouse)

df["blind_head"] = map_to_tax_unit(blind * head)
df["blind_spouse"] = map_to_tax_unit(blind * spouse)

df["nu18"] = map_to_tax_unit((age < 18) * dependent)
df["nu13"] = map_to_tax_unit((age < 13) * dependent)
df["nu06"] = map_to_tax_unit((age < 6) * dependent)
df["n1820"] = map_to_tax_unit(((age >= 18) & (age < 21)) * dependent)
df["n21"] = map_to_tax_unit((age >= 21) * dependent)
df["n24"] = map_to_tax_unit(
(age < 17) * dependent
) # following taxdata code.
df["n24"] = map_to_tax_unit((age < 17) * dependent) # using taxdata logic
df["elderly_dependents"] = map_to_tax_unit((age >= 65) * dependent)

# correct case of variable names for Tax-Calculator
# correct case of df variable names for Tax-Calculator
tc_variable_metadata = yaml.safe_load(
open(STORAGE_FOLDER / "input" / "taxcalc_variable_metadata.yaml", "r")
)
Expand Down

0 comments on commit 298ad99

Please sign in to comment.