Skip to content

Commit 61a43e9

Browse files
committed
Update package version
1 parent e0be63b commit 61a43e9

5 files changed

Lines changed: 23 additions & 17 deletions

File tree

CHANGELOG.md

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,10 @@
1+
## [1.112.2] - 2026-05-12
2+
3+
### Changed
4+
5+
- Remove reported SPM WIC, school meals, broadband, and tax inputs from CPS outputs in favor of policyengine-us formulas.
6+
7+
18
## [1.112.1] - 2026-05-12
29

310
### Fixed

changelog.d/remove-reported-spm-inputs.changed

Lines changed: 0 additions & 1 deletion
This file was deleted.

docs/generated/pipeline_api.json

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -61,7 +61,7 @@
6161
"docstring": "\"Add auto loan balance, interest and net_worth variable.",
6262
"id": "add_auto_loan",
6363
"kind": "function",
64-
"line": 2782,
64+
"line": 2775,
6565
"metadata": {
6666
"api_refs": [
6767
"policyengine_us_data.datasets.cps.cps.add_auto_loan_interest_and_net_worth"
@@ -88,7 +88,7 @@
8888
"docstring": "Populate household-level geography variables used by PolicyEngine US.\n\nArgs:\n cps: Output CPS H5 group receiving derived household variables.\n household: Raw CPS household table.",
8989
"id": "add_household_variables",
9090
"kind": "function",
91-
"line": 1444,
91+
"line": 1437,
9292
"metadata": {
9393
"api_refs": [
9494
"policyengine_us_data.datasets.cps.cps.add_household_variables"
@@ -115,7 +115,7 @@
115115
"docstring": "Add basic ID and weight variables.\n\nArgs:\n cps (h5py.File): The CPS dataset file.\n person (DataFrame): The person table of the ASEC.\n tax_unit (DataFrame): The tax unit table created from the person table\n of the ASEC.\n family (DataFrame): The family table of the ASEC.\n spm_unit (DataFrame): The SPM unit table created from the person table\n of the ASEC.\n household (DataFrame): The household table of the ASEC.",
116116
"id": "add_id_variables",
117117
"kind": "function",
118-
"line": 913,
118+
"line": 916,
119119
"metadata": {
120120
"api_refs": [
121121
"policyengine_us_data.datasets.cps.cps.add_id_variables"
@@ -142,7 +142,7 @@
142142
"docstring": "Impute ORG-derived wage and union inputs onto CPS persons.",
143143
"id": "add_org_inputs",
144144
"kind": "function",
145-
"line": 2666,
145+
"line": 2659,
146146
"metadata": {
147147
"api_refs": [
148148
"policyengine_us_data.datasets.cps.cps.add_org_labor_market_inputs"
@@ -169,7 +169,7 @@
169169
"docstring": "Add income variables.\n\nArgs:\n cps (h5py.File): The CPS dataset file.\n person (DataFrame): The CPS person table.\n year (int): The CPS year",
170170
"id": "add_personal_income_variables",
171171
"kind": "function",
172-
"line": 1119,
172+
"line": 1122,
173173
"metadata": {
174174
"api_refs": [
175175
"policyengine_us_data.datasets.cps.cps.add_personal_income_variables"
@@ -196,7 +196,7 @@
196196
"docstring": "Add personal demographic variables.\n\nArgs:\n cps (h5py.File): The CPS dataset file.\n person (DataFrame): The CPS person table.",
197197
"id": "add_personal_variables",
198198
"kind": "function",
199-
"line": 975,
199+
"line": 978,
200200
"metadata": {
201201
"api_refs": [
202202
"policyengine_us_data.datasets.cps.cps.add_personal_variables"
@@ -223,7 +223,7 @@
223223
"docstring": "",
224224
"id": "add_previous_year_income",
225225
"kind": "function",
226-
"line": 1486,
226+
"line": 1479,
227227
"metadata": {
228228
"api_refs": [
229229
"policyengine_us_data.datasets.cps.cps.add_previous_year_income"
@@ -277,7 +277,7 @@
277277
"docstring": "",
278278
"id": "add_spm_variables",
279279
"kind": "function",
280-
"line": 1396,
280+
"line": 1398,
281281
"metadata": {
282282
"api_refs": [
283283
"policyengine_us_data.datasets.cps.cps.add_spm_variables"
@@ -304,7 +304,7 @@
304304
"docstring": "Assign SSN card type using PRCITSHP, employment status, and ASEC-UA conditions.\nCodes:\n- 0: \"NONE\" - Likely undocumented immigrants\n- 1: \"CITIZEN\" - US citizens (born or naturalized)\n- 2: \"NON_CITIZEN_VALID_EAD\" - Non-citizens with work/study authorization\n- 3: \"OTHER_NON_CITIZEN\" - Non-citizens with indicators of legal status",
305305
"id": "add_ssn_card_type",
306306
"kind": "function",
307-
"line": 1592,
307+
"line": 1585,
308308
"metadata": {
309309
"api_refs": [
310310
"policyengine_us_data.datasets.cps.cps.add_ssn_card_type"
@@ -358,7 +358,7 @@
358358
"docstring": "",
359359
"id": "add_tips",
360360
"kind": "function",
361-
"line": 2491,
361+
"line": 2484,
362362
"metadata": {
363363
"api_refs": [
364364
"policyengine_us_data.datasets.cps.cps.add_tips"
@@ -810,7 +810,7 @@
810810
"docstring": "Replace clone-half person-level feature variables with donor matches.",
811811
"id": "clone_features",
812812
"kind": "function",
813-
"line": 409,
813+
"line": 400,
814814
"metadata": {
815815
"api_refs": [
816816
"policyengine_us_data.datasets.cps.extended_cps._splice_clone_feature_predictions"
@@ -936,7 +936,7 @@
936936
"docstring": "Second-stage QRF: train on CPS, predict for PUF clones.\n\nFor the PUF clone half of the extended CPS we need plausible values\nof CPS-only variables (retirement distributions, transfers, hours,\nSPM components, etc.) that are consistent with the clone's\nPUF-imputed income -- not just naively copied from the CPS donor.\n\nWe train a QRF on CPS person-level data where:\n * predictors = demographics + key income variables\n * outputs = CPS-only variables listed in\n ``CPS_ONLY_IMPUTED_VARIABLES``\n\nFor PUF clone prediction we use the PUF-imputed income values\nfrom the second half of ``data`` (the clone half, which already\nhas PUF-imputed income from stage 1).\n\nUses ``fit_predict()`` with ``max_train_samples`` instead of\nmanual sampling + separate fit/predict.\n\nArgs:\n data: Extended dataset dict after ``puf_clone_dataset()`` --\n already doubled, with PUF-imputed income in the second half.\n time_period: Tax year.\n dataset_path: Path to the CPS h5 file for Microsimulation.\n\nReturns:\n DataFrame with one column per CPS-only variable, containing\n predicted values for the PUF clone half (person-level).",
937937
"id": "cps_only",
938938
"kind": "function",
939-
"line": 448,
939+
"line": 439,
940940
"metadata": {
941941
"api_refs": [
942942
"policyengine_us_data.datasets.cps.extended_cps._impute_cps_only_variables"
@@ -1089,7 +1089,7 @@
10891089
"docstring": "Remove variables that are computed by policyengine-us.\n\nVariables with formulas, ``adds``, or ``subtracts`` are\nrecomputed by the simulation engine, so storing them wastes\nspace and can mislead validation.\n\nAggregate variables whose ``adds`` include a behavioral-\nresponse input (e.g. ``employment_income_before_lsr``) are\nrenamed to that input before dropping so the raw data is\npreserved under the correct input-variable name.",
10901090
"id": "formula_drop",
10911091
"kind": "function",
1092-
"line": 1206,
1092+
"line": 1197,
10931093
"metadata": {
10941094
"api_refs": [
10951095
"policyengine_us_data.datasets.cps.extended_cps.ExtendedCPS._drop_formula_variables"
@@ -1950,7 +1950,7 @@
19501950
"docstring": "Replace PUF clone half of CPS-only variables with QRF predictions.\n\nAfter ``puf_clone_dataset()`` the CPS-only variables in the second\nhalf are naive copies of the CPS donor values. This function\nreplaces them with the second-stage QRF predictions that are\nconsistent with the clone's PUF-imputed income.\n\nArgs:\n data: Extended dataset dict (already doubled).\n predictions: DataFrame from ``_impute_cps_only_variables()``.\n time_period: Tax year.\n dataset_path: Path to CPS h5 file for entity mapping.\n\nReturns:\n Modified data dict with CPS-only variables spliced in.",
19511951
"id": "qrf_pass2",
19521952
"kind": "function",
1953-
"line": 726,
1953+
"line": 717,
19541954
"metadata": {
19551955
"api_refs": [
19561956
"policyengine_us_data.datasets.cps.extended_cps._splice_cps_only_predictions"

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ build-backend = "setuptools.build_meta"
88

99
[project]
1010
name = "policyengine_us_data"
11-
version = "1.112.1"
11+
version = "1.112.2"
1212
description = "A package to create representative microdata for the US."
1313
readme = "README.md"
1414
authors = [

uv.lock

Lines changed: 1 addition & 1 deletion
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments
 (0)