fix: update pipeline imports to use sport modules

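After the Phase 1 refactoring moved the scraper functions into
sport-specific modules (nba.py, mlb.py, etc.), these pipeline scripts
still imported them from scrape_schedules.py. Shared helpers are now
imported from core.py and the NBA/MLB/NHL/NFL scrapers from their sport
modules; the secondary-sport scrapers (WNBA, MLS, NWSL, CBB) are still
imported from scrape_schedules.py.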

- run_pipeline.py: import from core.py and sport modules
- validate_data.py: import from core.py and sport modules
- run_canonicalization_pipeline.py: import from core.py and sport modules

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
Trey t
2026-01-10 10:52:13 -06:00
parent 78f08449fc
commit 63fb06c41a
3 changed files with 38 additions and 34 deletions

View File

@@ -29,17 +29,20 @@ from datetime import datetime
from pathlib import Path
from dataclasses import dataclass, asdict
# Import pipeline components
from scrape_schedules import (
# Import from core module
from core import (
ScraperSource, scrape_with_fallback,
# NBA sources
scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports,
# MLB sources
scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn,
# NHL sources
scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api,
# NFL sources
scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports,
assign_stable_ids, export_to_json,
)
# Import from sport modules
from nba import scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn
from nhl import scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api
from nfl import scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports
# Import secondary sports from scrape_schedules (stubs)
from scrape_schedules import (
# WNBA sources
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
# MLS sources
@@ -50,8 +53,6 @@ from scrape_schedules import (
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
# Utilities
generate_stadiums_from_teams,
assign_stable_ids,
export_to_json,
)
from canonicalize_stadiums import (
canonicalize_stadiums,

View File

@@ -21,17 +21,20 @@ from dataclasses import dataclass
from typing import Optional
from enum import Enum
# Import our modules
from scrape_schedules import (
# Import from core module
from core import (
Game, Stadium, ScraperSource, scrape_with_fallback,
# NBA sources
scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports,
# MLB sources
scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn,
# NHL sources
scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api,
# NFL sources
scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports,
assign_stable_ids, export_to_json,
)
# Import from sport modules
from nba import scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn
from nhl import scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api
from nfl import scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports
# Import secondary sports from scrape_schedules (stubs)
from scrape_schedules import (
# WNBA sources
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
# MLS sources
@@ -42,8 +45,6 @@ from scrape_schedules import (
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
# Utilities
generate_stadiums_from_teams,
export_to_json,
assign_stable_ids,
)
from validate_data import (
validate_games,

View File

@@ -16,17 +16,19 @@ from dataclasses import dataclass, asdict, field
from typing import Optional
from collections import defaultdict
# Import scrapers from main script
# Import from core module
from core import Game, Stadium, assign_stable_ids
# Import from sport modules
from nba import scrape_nba_basketball_reference, NBA_TEAMS
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, MLB_TEAMS
from nhl import scrape_nhl_hockey_reference, NHL_TEAMS
from nfl import scrape_nfl_espn, NFL_TEAMS
# Import secondary sports from scrape_schedules (stubs)
from scrape_schedules import (
Game, Stadium,
scrape_nba_basketball_reference,
scrape_mlb_statsapi, scrape_mlb_baseball_reference,
scrape_nhl_hockey_reference,
scrape_wnba_espn, scrape_mls_espn, scrape_nwsl_espn,
scrape_nfl_espn, scrape_cbb_espn,
NBA_TEAMS, MLB_TEAMS, NHL_TEAMS, WNBA_TEAMS, MLS_TEAMS, NWSL_TEAMS,
NFL_TEAMS,
assign_stable_ids,
scrape_wnba_espn, scrape_mls_espn, scrape_nwsl_espn, scrape_cbb_espn,
WNBA_TEAMS, MLS_TEAMS, NWSL_TEAMS,
)