diff --git a/changelog.d/fix-enhanced-cps-overwrite.fixed.md b/changelog.d/fix-enhanced-cps-overwrite.fixed.md new file mode 100644 index 00000000..3faa4c36 --- /dev/null +++ b/changelog.d/fix-enhanced-cps-overwrite.fixed.md @@ -0,0 +1 @@ +Fix create_sparse_ecps overwriting enhanced_cps_2024.h5 with a sparse version that drops input variables like employment_income. diff --git a/policyengine_us_data/datasets/cps/small_enhanced_cps.py b/policyengine_us_data/datasets/cps/small_enhanced_cps.py index 5e099bec..ccee6458 100644 --- a/policyengine_us_data/datasets/cps/small_enhanced_cps.py +++ b/policyengine_us_data/datasets/cps/small_enhanced_cps.py @@ -104,7 +104,7 @@ def create_sparse_ecps(): if len(data[variable]) == 0: del data[variable] - with h5py.File(STORAGE_FOLDER / "enhanced_cps_2024.h5", "w") as f: + with h5py.File(STORAGE_FOLDER / "sparse_enhanced_cps_2024.h5", "w") as f: for variable, periods in data.items(): grp = f.create_group(variable) for period, values in periods.items():