feat(scripts): complete data pipeline remediation
Scripts changes:
- Add WNBA abbreviation aliases to team_resolver.py
- Fix NHL stadium coordinates in stadium_resolver.py
- Add validate_aliases.py script for orphan detection
- Update scrapers with improved error handling
- Add DATA_AUDIT.md and REMEDIATION_PLAN.md documentation
- Update alias JSON files with new mappings

iOS bundle updates:
- Update games_canonical.json with latest scraped data
- Update teams_canonical.json and stadiums_canonical.json
- Sync alias files with Scripts versions

All 5 remediation phases complete.

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
@@ -583,25 +583,25 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "mercedes-benz stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mercedesbenz_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mercedes_benz_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "mercedesbenz stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mercedesbenz_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mercedes_benz_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "m&t bank stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mt_bank_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mandt_bank_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "mt bank stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mt_bank_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_mandt_bank_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
@@ -631,7 +631,7 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "cleveland browns stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_cleveland_browns_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_huntington_bank_field",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
@@ -649,7 +649,7 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "empower field at mile high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field_at_mile_high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
@@ -685,7 +685,7 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "geha field at arrowhead stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_geha_field_at_arrowhead_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_arrowhead_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
@@ -787,13 +787,13 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "mercedes-benz stadium",
|
||||
"stadium_canonical_id": "stadium_mls_mercedesbenz_stadium",
|
||||
"stadium_canonical_id": "stadium_mls_mercedes_benz_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "mercedesbenz stadium",
|
||||
"stadium_canonical_id": "stadium_mls_mercedesbenz_stadium",
|
||||
"stadium_canonical_id": "stadium_mls_mercedes_benz_stadium",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
@@ -1405,25 +1405,25 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "broncos stadium at mile high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field_at_mile_high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field",
|
||||
"valid_from": "2018-09-01",
|
||||
"valid_until": "2019-08-31"
|
||||
},
|
||||
{
|
||||
"alias_name": "sports authority field at mile high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field_at_mile_high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field",
|
||||
"valid_from": "2011-08-01",
|
||||
"valid_until": "2018-08-31"
|
||||
},
|
||||
{
|
||||
"alias_name": "invesco field at mile high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field_at_mile_high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field",
|
||||
"valid_from": "2001-09-01",
|
||||
"valid_until": "2011-07-31"
|
||||
},
|
||||
{
|
||||
"alias_name": "mile high stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field_at_mile_high",
|
||||
"stadium_canonical_id": "stadium_nfl_empower_field",
|
||||
"valid_from": "1960-01-01",
|
||||
"valid_until": "2001-08-31"
|
||||
},
|
||||
@@ -1531,7 +1531,7 @@
|
||||
},
|
||||
{
|
||||
"alias_name": "arrowhead stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_geha_field_at_arrowhead_stadium",
|
||||
"stadium_canonical_id": "stadium_nfl_arrowhead_stadium",
|
||||
"valid_from": "1972-08-01",
|
||||
"valid_until": null
|
||||
},
|
||||
@@ -1924,5 +1924,113 @@
|
||||
"stadium_canonical_id": "stadium_mlb_journey_bank_ballpark",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "mortgage matchup center",
|
||||
"stadium_canonical_id": "stadium_nba_rocket_mortgage_fieldhouse",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "xfinity mobile arena",
|
||||
"stadium_canonical_id": "stadium_nba_intuit_dome",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "rocket arena",
|
||||
"stadium_canonical_id": "stadium_nba_toyota_center",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "mexico city arena",
|
||||
"stadium_canonical_id": "stadium_nba_mexico_city_arena",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "arena cdmx",
|
||||
"stadium_canonical_id": "stadium_nba_mexico_city_arena",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "scottsmiracle-gro field",
|
||||
"stadium_canonical_id": "stadium_mls_lowercom_field",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "scotts miracle-gro field",
|
||||
"stadium_canonical_id": "stadium_mls_lowercom_field",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "energizer park",
|
||||
"stadium_canonical_id": "stadium_mls_citypark",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "sports illustrated stadium",
|
||||
"stadium_canonical_id": "stadium_mls_red_bull_arena",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "sports illustrated stadium",
|
||||
"stadium_canonical_id": "stadium_nwsl_red_bull_arena",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "soldier field",
|
||||
"stadium_canonical_id": "stadium_nwsl_soldier_field",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "oracle park",
|
||||
"stadium_canonical_id": "stadium_nwsl_oracle_park",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "carefirst arena",
|
||||
"stadium_canonical_id": "stadium_wnba_entertainment_sports_arena",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "care first arena",
|
||||
"stadium_canonical_id": "stadium_wnba_entertainment_sports_arena",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "mortgage matchup center",
|
||||
"stadium_canonical_id": "stadium_wnba_rocket_mortgage_fieldhouse",
|
||||
"valid_from": "2025-01-01",
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "state farm arena",
|
||||
"stadium_canonical_id": "stadium_wnba_state_farm_arena",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "cfg bank arena",
|
||||
"stadium_canonical_id": "stadium_wnba_cfg_bank_arena",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
},
|
||||
{
|
||||
"alias_name": "purcell pavilion",
|
||||
"stadium_canonical_id": "stadium_wnba_purcell_pavilion",
|
||||
"valid_from": null,
|
||||
"valid_until": null
|
||||
}
|
||||
]
|
||||
Reference in New Issue
Block a user