From df453072eb89e4ec33bc0f33e34fa922d89694ae Mon Sep 17 00:00:00 2001
From: Max Ghenis
Date: Sat, 31 Jan 2026 23:20:03 -0500
Subject: [PATCH] Add cps_2024.h5 to HuggingFace upload list
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The raw (unenhanced) CPS 2024 dataset was never being uploaded to
HuggingFace — only enhanced_cps_2024.h5 and small_enhanced_cps_2024.h5
were included. This means downstream consumers couldn't access the raw
CPS for the 2024 ASEC survey year.

Closes #501

Co-Authored-By: Claude Opus 4.5
---
 changelog_entry.yaml                                      | 4 ++++
 policyengine_us_data/storage/upload_completed_datasets.py | 2 ++
 2 files changed, 6 insertions(+)

diff --git a/changelog_entry.yaml b/changelog_entry.yaml
index e69de29bb..e9d926742 100644
--- a/changelog_entry.yaml
+++ b/changelog_entry.yaml
@@ -0,0 +1,4 @@
+- bump: patch
+  changes:
+    added:
+    - cps_2024.h5 to HuggingFace upload list so the raw (unenhanced) 2024 CPS dataset is published
diff --git a/policyengine_us_data/storage/upload_completed_datasets.py b/policyengine_us_data/storage/upload_completed_datasets.py
index c8b903cf6..a1e68575c 100644
--- a/policyengine_us_data/storage/upload_completed_datasets.py
+++ b/policyengine_us_data/storage/upload_completed_datasets.py
@@ -1,6 +1,7 @@
 from policyengine_us_data.datasets import (
     EnhancedCPS_2024,
 )
+from policyengine_us_data.datasets.cps.cps import CPS_2024
 from policyengine_us_data.storage import STORAGE_FOLDER
 from policyengine_us_data.utils.data_upload import upload_data_files
 from google.cloud import storage
@@ -10,6 +11,7 @@
 def upload_datasets():
     dataset_files = [
         EnhancedCPS_2024.file_path,
+        CPS_2024.file_path,
         STORAGE_FOLDER / "small_enhanced_cps_2024.h5",
         STORAGE_FOLDER / "calibration" / "policy_data.db",
     ]