fix: update pipeline imports to use sport modules
After the Phase 1 refactoring moved the scraper functions into sport-specific modules (nba.py, mlb.py, etc.), these pipeline scripts still imported them from scrape_schedules.py.

- run_pipeline.py: import from core.py and sport modules
- validate_data.py: import from core.py and sport modules
- run_canonicalization_pipeline.py: import from core.py and sport modules

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
@@ -29,17 +29,20 @@ from datetime import datetime
|
|||||||
from pathlib import Path
|
from pathlib import Path
|
||||||
from dataclasses import dataclass, asdict
|
from dataclasses import dataclass, asdict
|
||||||
|
|
||||||
# Import pipeline components
|
# Import from core module
|
||||||
from scrape_schedules import (
|
from core import (
|
||||||
ScraperSource, scrape_with_fallback,
|
ScraperSource, scrape_with_fallback,
|
||||||
# NBA sources
|
assign_stable_ids, export_to_json,
|
||||||
scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports,
|
)
|
||||||
# MLB sources
|
|
||||||
scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn,
|
# Import from sport modules
|
||||||
# NHL sources
|
from nba import scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports
|
||||||
scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api,
|
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn
|
||||||
# NFL sources
|
from nhl import scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api
|
||||||
scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports,
|
from nfl import scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports
|
||||||
|
|
||||||
|
# Import secondary sports from scrape_schedules (stubs)
|
||||||
|
from scrape_schedules import (
|
||||||
# WNBA sources
|
# WNBA sources
|
||||||
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
|
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
|
||||||
# MLS sources
|
# MLS sources
|
||||||
@@ -50,8 +53,6 @@ from scrape_schedules import (
|
|||||||
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
|
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
|
||||||
# Utilities
|
# Utilities
|
||||||
generate_stadiums_from_teams,
|
generate_stadiums_from_teams,
|
||||||
assign_stable_ids,
|
|
||||||
export_to_json,
|
|
||||||
)
|
)
|
||||||
from canonicalize_stadiums import (
|
from canonicalize_stadiums import (
|
||||||
canonicalize_stadiums,
|
canonicalize_stadiums,
|
||||||
|
|||||||
@@ -21,17 +21,20 @@ from dataclasses import dataclass
|
|||||||
from typing import Optional
|
from typing import Optional
|
||||||
from enum import Enum
|
from enum import Enum
|
||||||
|
|
||||||
# Import our modules
|
# Import from core module
|
||||||
from scrape_schedules import (
|
from core import (
|
||||||
Game, Stadium, ScraperSource, scrape_with_fallback,
|
Game, Stadium, ScraperSource, scrape_with_fallback,
|
||||||
# NBA sources
|
assign_stable_ids, export_to_json,
|
||||||
scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports,
|
)
|
||||||
# MLB sources
|
|
||||||
scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn,
|
# Import from sport modules
|
||||||
# NHL sources
|
from nba import scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports
|
||||||
scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api,
|
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn
|
||||||
# NFL sources
|
from nhl import scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api
|
||||||
scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports,
|
from nfl import scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports
|
||||||
|
|
||||||
|
# Import secondary sports from scrape_schedules (stubs)
|
||||||
|
from scrape_schedules import (
|
||||||
# WNBA sources
|
# WNBA sources
|
||||||
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
|
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
|
||||||
# MLS sources
|
# MLS sources
|
||||||
@@ -42,8 +45,6 @@ from scrape_schedules import (
|
|||||||
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
|
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
|
||||||
# Utilities
|
# Utilities
|
||||||
generate_stadiums_from_teams,
|
generate_stadiums_from_teams,
|
||||||
export_to_json,
|
|
||||||
assign_stable_ids,
|
|
||||||
)
|
)
|
||||||
from validate_data import (
|
from validate_data import (
|
||||||
validate_games,
|
validate_games,
|
||||||
|
|||||||
@@ -16,17 +16,19 @@ from dataclasses import dataclass, asdict, field
|
|||||||
from typing import Optional
|
from typing import Optional
|
||||||
from collections import defaultdict
|
from collections import defaultdict
|
||||||
|
|
||||||
# Import scrapers from main script
|
# Import from core module
|
||||||
|
from core import Game, Stadium, assign_stable_ids
|
||||||
|
|
||||||
|
# Import from sport modules
|
||||||
|
from nba import scrape_nba_basketball_reference, NBA_TEAMS
|
||||||
|
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, MLB_TEAMS
|
||||||
|
from nhl import scrape_nhl_hockey_reference, NHL_TEAMS
|
||||||
|
from nfl import scrape_nfl_espn, NFL_TEAMS
|
||||||
|
|
||||||
|
# Import secondary sports from scrape_schedules (stubs)
|
||||||
from scrape_schedules import (
|
from scrape_schedules import (
|
||||||
Game, Stadium,
|
scrape_wnba_espn, scrape_mls_espn, scrape_nwsl_espn, scrape_cbb_espn,
|
||||||
scrape_nba_basketball_reference,
|
WNBA_TEAMS, MLS_TEAMS, NWSL_TEAMS,
|
||||||
scrape_mlb_statsapi, scrape_mlb_baseball_reference,
|
|
||||||
scrape_nhl_hockey_reference,
|
|
||||||
scrape_wnba_espn, scrape_mls_espn, scrape_nwsl_espn,
|
|
||||||
scrape_nfl_espn, scrape_cbb_espn,
|
|
||||||
NBA_TEAMS, MLB_TEAMS, NHL_TEAMS, WNBA_TEAMS, MLS_TEAMS, NWSL_TEAMS,
|
|
||||||
NFL_TEAMS,
|
|
||||||
assign_stable_ids,
|
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user