From 1fc348f10cb1760bb360f7764b85e55af5646abf Mon Sep 17 00:00:00 2001 From: Deeman Date: Thu, 26 Feb 2026 00:02:40 +0100 Subject: [PATCH] feat(extract): lower US city population threshold to 10K MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 878 → 4212 cities. Broadens coverage to match the granularity of Eurostat and GeoNames data for smaller metro markets. Co-Authored-By: Claude Sonnet 4.6 --- .../padelnomics_extract/src/padelnomics_extract/census_usa.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/extract/padelnomics_extract/src/padelnomics_extract/census_usa.py b/extract/padelnomics_extract/src/padelnomics_extract/census_usa.py index 657bc05..91e35a8 100644 --- a/extract/padelnomics_extract/src/padelnomics_extract/census_usa.py +++ b/extract/padelnomics_extract/src/padelnomics_extract/census_usa.py @@ -33,7 +33,7 @@ ACS_URL = ( ) REF_YEAR = 2023 -MIN_POPULATION = 50_000 +MIN_POPULATION = 10_000 MAX_RETRIES = 2 @@ -119,7 +119,7 @@ def extract( "country_code": "US", }) - assert len(rows) > 500, f"Expected >500 US cities ≥50K pop, got {len(rows)} — parse may have failed" + assert len(rows) > 2000, f"Expected >2000 US cities ≥10K pop, got {len(rows)} — parse may have failed" logger.info("parsed %d US cities with population ≥%d", len(rows), MIN_POPULATION) dest_dir = landing_path(landing_dir, "census_usa", year, month)