Remove old code that was commented out

donboyd5 · Aug 22, 2024 · 13d7686 · 13d7686
1 parent e1b7e76
commit 13d7686
Showing 1 changed file with 9 additions and 140 deletions.
diff --git a/tax_microdata_benchmarking/datasets/taxcalc_dataset.py b/tax_microdata_benchmarking/datasets/taxcalc_dataset.py
@@ -152,177 +152,46 @@ def pe(variable):
         + pe("estate_income")
         + pe("farm_rent_income")
     )
-
     df = pd.DataFrame(var)
 
-    """
-    df = pd.DataFrame()
-
-    df["E03500"] = pe("alimony_expense")
-    df["E00800"] = pe("alimony_income")
-    df["G20500"] = pe(
-        "casualty_loss"
-    )  # Amend with taxdata treatment from e20500
-    df["E32800"] = pe("cdcc_relevant_expenses")
-    df["E19800"] = pe("charitable_cash_donations")
-    df["E20100"] = pe("charitable_non_cash_donations")
-    df["XTOT"] = pe("exemptions_count")
-    df["E03240"] = pe("domestic_production_ald")
-    df["E03400"] = pe("early_withdrawal_penalty")
-    df["E03220"] = pe("educator_expense")
-    df["E00200"] = pe("employment_income")
-    df["E02100"] = pe("farm_income")
-    df["E27200"] = pe("farm_rent_income")
-    df["E03290"] = pe("health_savings_account_ald")
-    df["E19200"] = pe("interest_deduction")
-    df["P23250"] = pe("long_term_capital_gains")
-    df["E24518"] = pe("long_term_capital_gains_on_collectibles")
-    df["E17500"] = pe("medical_expense")
-    df["E00600"] = pe("non_qualified_dividend_income") + pe(
-        "qualified_dividend_income"
-    )
-    df["E00650"] = pe("qualified_dividend_income")
-    df["E26270"] = pe("partnership_s_corp_income")
-    df["E03230"] = pe("qualified_tuition_expenses")
-    df["E18500"] = pe("real_estate_taxes")
-    df["E00900"] = pe("self_employment_income")
-    df["E03270"] = pe("self_employed_health_insurance_ald")
-    df["E03300"] = pe("self_employed_pension_contribution_ald")
-    df["P22250"] = pe("short_term_capital_gains")
-    df["E02400"] = pe("social_security")
-    df["E18400"] = pe("state_and_local_sales_or_income_tax")
-    df["E03210"] = pe("student_loan_interest")
-    df["E00300"] = pe("taxable_interest_income")
-    df["E01700"] = pe("taxable_pension_income")
-    df["E02300"] = pe("taxable_unemployment_compensation")
-    df["E01400"] = pe("taxable_ira_distributions")
-    df["E00400"] = pe("tax_exempt_interest_income")
-    df["E01500"] = pe("tax_exempt_pension_income") + pe(
-        "taxable_pension_income"
-    )
-    df["E01700"] = pe("taxable_pension_income")
-    df["E03150"] = pe("traditional_ira_contributions")
-    df["E24515"] = pe("unrecaptured_section_1250_gain")
-    df["E27200"] = pe("farm_rent_income")
-    df["MARS"] = (
-        pd.Series(pe("filing_status"))
-        .map(
-            {
-                "SINGLE": 1,
-                "JOINT": 2,
-                "SEPARATE": 3,
-                "HEAD_OF_HOUSEHOLD": 4,
-                "SURVIVING_SPOUSE": 5,
-            }
-        )
-        .values
-    )
-    df["RECID"] = pe("household_id")
-    df["S006"] = pe("tax_unit_weight")
-    df["a_lineno"] = 0  # TD-specific (CPS matched person ID)
-    df["agi_bin"] = 0  # TD-specific (AGI bin)
-    df["h_seq"] = 0  # TD-specific (CPS matched household ID)
-    df["ffpos"] = 0  # TD-specific (CPS matched family ID)
-    df["fips"] = 0  # No FIPS data
-    df["DSI"] = 0  # Claimed as dependent on another return, assume not
-    df["EIC"] = np.minimum(pe("eitc_child_count"), 3)
-    df["FLPDYR"] = year
-    df["MIDR"] = 0  # Separately filing spouse itemizes, assume not
-    df["PT_SSTB_income"] = (
-        0  # Business income is from specified service trade assume not
-    )
-    df["tanf_ben"] = 0  # TANF benefits, assume none
-    df["vet_ben"] = 0  # Veteran's benefits, assume none
-    df["wic_ben"] = 0  # WIC benefits, assume none
-    df["snap_ben"] = 0  # SNAP benefits, assume none
-    df["housing_ben"] = 0  # Housing benefits, assume none
-    df["ssi_ben"] = 0  # SSI benefits, assume none
-    df["mcare_ben"] = 0  # Medicare benefits, assume none
-    df["mcaid_ben"] = 0  # Medicaid benefits, assume none
-    df["other_ben"] = 0  # Other benefits, assume none
-    df["PT_binc_w2_wages"] = pe("w2_wages_from_qualified_business")
-    df["PT_ubia_property"] = 0
-    df["data_source"] = 1 if "puf" in pe_dataset.__name__.lower() else 0
-    df["e02000"] = (
-        pe("rental_income")
-        + pe("partnership_s_corp_income")
-        + pe("estate_income")
-        + pe("farm_rent_income")
-    )
-    df["e20400"] = pe("misc_deduction")
-    df["e07300"] = pe("foreign_tax_credit")
-    df["e62900"] = pe("amt_foreign_tax_credit")
-    df["e01200"] = pe("miscellaneous_income")
-    df["e00700"] = pe("salt_refund_income")
-    df["e58990"] = pe("investment_income_elected_form_4952")
-    df["e07400"] = pe("general_business_credit")
-    df["e07600"] = pe("prior_year_minimum_tax_credit")
-    df["e11200"] = pe("excess_withheld_payroll_tax")
-    df["e01100"] = pe("non_sch_d_capital_gains")
-    df["e87521"] = pe("american_opportunity_credit")
-    df["e07260"] = pe("energy_efficient_home_improvement_credit")
-    df["e09900"] = pe("early_withdrawal_penalty")
-    df["p08000"] = pe("other_credits")
-    df["e07240"] = pe("savers_credit")
-    df["e09700"] = pe("recapture_of_investment_credit")
-    df["e09800"] = pe("unreported_payroll_tax")
-    df["f2441"] = pe("count_cdcc_eligible")
-    df["e87530"] = df[
-        "E03230"
-    ]  # Assume same definition for tuition expenses (for now).
-
-    df["cmbtp"] = 0
-    df["f6251"] = 0
-    df["k1bx14p"] = 0
-    df["k1bx14s"] = 0
-    """
-
-    # head and spouse pairs
-
     map_to_tax_unit = lambda arr: pe_sim.map_result(arr, "person", "tax_unit")
 
-    filer = pe_sim.calculate("is_tax_unit_head").values
+    # specify df head/spouse variables
+    head = pe_sim.calculate("is_tax_unit_head").values
     spouse = pe_sim.calculate("is_tax_unit_spouse").values
 
     employment_income = pe_sim.calculate("employment_income").values
     self_employment_income = pe_sim.calculate("self_employment_income").values
     farm_income = pe_sim.calculate("farm_income").values
     pre_tax_contributions = pe_sim.calculate("pre_tax_contributions").values
 
-    df["e00200p"] = map_to_tax_unit(employment_income * filer)
+    df["e00200p"] = map_to_tax_unit(employment_income * head)
     df["e00200s"] = map_to_tax_unit(employment_income * spouse)
-    df["e00900p"] = map_to_tax_unit(self_employment_income * filer)
+    df["e00900p"] = map_to_tax_unit(self_employment_income * head)
     df["e00900s"] = map_to_tax_unit(self_employment_income * spouse)
-    df["e02100p"] = map_to_tax_unit(farm_income * filer)
+    df["e02100p"] = map_to_tax_unit(farm_income * head)
     df["e02100s"] = map_to_tax_unit(farm_income * spouse)
-    df["pencon_p"] = map_to_tax_unit(pre_tax_contributions * filer)
+    df["pencon_p"] = map_to_tax_unit(pre_tax_contributions * head)
     df["pencon_s"] = map_to_tax_unit(pre_tax_contributions * spouse)
 
-    # Demographics
-
+    # specify df demographics
     age = pe_sim.calculate("age").values
-    head = pe_sim.calculate("is_tax_unit_head").values
-    spouse = pe_sim.calculate("is_tax_unit_spouse").values
     dependent = pe_sim.calculate("is_tax_unit_dependent").values
     blind = pe_sim.calculate("is_blind").values
 
     df["age_head"] = map_to_tax_unit(age * head)
     df["age_spouse"] = map_to_tax_unit(age * spouse)
-
     df["blind_head"] = map_to_tax_unit(blind * head)
     df["blind_spouse"] = map_to_tax_unit(blind * spouse)
-
     df["nu18"] = map_to_tax_unit((age < 18) * dependent)
     df["nu13"] = map_to_tax_unit((age < 13) * dependent)
     df["nu06"] = map_to_tax_unit((age < 6) * dependent)
     df["n1820"] = map_to_tax_unit(((age >= 18) & (age < 21)) * dependent)
     df["n21"] = map_to_tax_unit((age >= 21) * dependent)
-    df["n24"] = map_to_tax_unit(
-        (age < 17) * dependent
-    )  # following taxdata code.
+    df["n24"] = map_to_tax_unit((age < 17) * dependent)  # using taxdata logic
     df["elderly_dependents"] = map_to_tax_unit((age >= 65) * dependent)
 
-    # correct case of variable names for Tax-Calculator
+    # correct case of df variable names for Tax-Calculator
     tc_variable_metadata = yaml.safe_load(
         open(STORAGE_FOLDER / "input" / "taxcalc_variable_metadata.yaml", "r")
     )