feat(extract): lower US city population threshold to 10K
This raises the number of extracted US cities from 878 to 4212. It broadens coverage to match the granularity of Eurostat and GeoNames data for smaller metro markets.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
@@ -33,7 +33,7 @@ ACS_URL = (
|
|||||||
)
|
)
|
||||||
|
|
||||||
REF_YEAR = 2023
|
REF_YEAR = 2023
|
||||||
MIN_POPULATION = 50_000
|
MIN_POPULATION = 10_000
|
||||||
MAX_RETRIES = 2
|
MAX_RETRIES = 2
|
||||||
|
|
||||||
|
|
||||||
@@ -119,7 +119,7 @@ def extract(
|
|||||||
"country_code": "US",
|
"country_code": "US",
|
||||||
})
|
})
|
||||||
|
|
||||||
assert len(rows) > 500, f"Expected >500 US cities ≥50K pop, got {len(rows)} — parse may have failed"
|
assert len(rows) > 2000, f"Expected >2000 US cities ≥10K pop, got {len(rows)} — parse may have failed"
|
||||||
logger.info("parsed %d US cities with population ≥%d", len(rows), MIN_POPULATION)
|
logger.info("parsed %d US cities with population ≥%d", len(rows), MIN_POPULATION)
|
||||||
|
|
||||||
dest_dir = landing_path(landing_dir, "census_usa", year, month)
|
dest_dir = landing_path(landing_dir, "census_usa", year, month)
|
||||||
|
|||||||
Reference in New Issue
Block a user