fix: update pipeline imports to use sport modules
After the Phase 1 refactoring moved the scraper functions into sport-specific modules (nba.py, mlb.py, etc.), these pipeline scripts still imported them from scrape_schedules.py.

- run_pipeline.py: import from core.py and sport modules
- validate_data.py: import from core.py and sport modules
- run_canonicalization_pipeline.py: import from core.py and sport modules

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
@@ -29,17 +29,20 @@ from datetime import datetime
|
||||
from pathlib import Path
|
||||
from dataclasses import dataclass, asdict
|
||||
|
||||
# Import pipeline components
|
||||
from scrape_schedules import (
|
||||
# Import from core module
|
||||
from core import (
|
||||
ScraperSource, scrape_with_fallback,
|
||||
# NBA sources
|
||||
scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports,
|
||||
# MLB sources
|
||||
scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn,
|
||||
# NHL sources
|
||||
scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api,
|
||||
# NFL sources
|
||||
scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports,
|
||||
assign_stable_ids, export_to_json,
|
||||
)
|
||||
|
||||
# Import from sport modules
|
||||
from nba import scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports
|
||||
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn
|
||||
from nhl import scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api
|
||||
from nfl import scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports
|
||||
|
||||
# Import secondary sports from scrape_schedules (stubs)
|
||||
from scrape_schedules import (
|
||||
# WNBA sources
|
||||
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
|
||||
# MLS sources
|
||||
@@ -50,8 +53,6 @@ from scrape_schedules import (
|
||||
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
|
||||
# Utilities
|
||||
generate_stadiums_from_teams,
|
||||
assign_stable_ids,
|
||||
export_to_json,
|
||||
)
|
||||
from canonicalize_stadiums import (
|
||||
canonicalize_stadiums,
|
||||
|
||||
@@ -21,17 +21,20 @@ from dataclasses import dataclass
|
||||
from typing import Optional
|
||||
from enum import Enum
|
||||
|
||||
# Import our modules
|
||||
from scrape_schedules import (
|
||||
# Import from core module
|
||||
from core import (
|
||||
Game, Stadium, ScraperSource, scrape_with_fallback,
|
||||
# NBA sources
|
||||
scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports,
|
||||
# MLB sources
|
||||
scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn,
|
||||
# NHL sources
|
||||
scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api,
|
||||
# NFL sources
|
||||
scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports,
|
||||
assign_stable_ids, export_to_json,
|
||||
)
|
||||
|
||||
# Import from sport modules
|
||||
from nba import scrape_nba_basketball_reference, scrape_nba_espn, scrape_nba_cbssports
|
||||
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, scrape_mlb_espn
|
||||
from nhl import scrape_nhl_hockey_reference, scrape_nhl_espn, scrape_nhl_api
|
||||
from nfl import scrape_nfl_espn, scrape_nfl_pro_football_reference, scrape_nfl_cbssports
|
||||
|
||||
# Import secondary sports from scrape_schedules (stubs)
|
||||
from scrape_schedules import (
|
||||
# WNBA sources
|
||||
scrape_wnba_espn, scrape_wnba_basketball_reference, scrape_wnba_cbssports,
|
||||
# MLS sources
|
||||
@@ -42,8 +45,6 @@ from scrape_schedules import (
|
||||
scrape_cbb_espn, scrape_cbb_sports_reference, scrape_cbb_cbssports,
|
||||
# Utilities
|
||||
generate_stadiums_from_teams,
|
||||
export_to_json,
|
||||
assign_stable_ids,
|
||||
)
|
||||
from validate_data import (
|
||||
validate_games,
|
||||
|
||||
@@ -16,17 +16,19 @@ from dataclasses import dataclass, asdict, field
|
||||
from typing import Optional
|
||||
from collections import defaultdict
|
||||
|
||||
# Import scrapers from main script
|
||||
# Import from core module
|
||||
from core import Game, Stadium, assign_stable_ids
|
||||
|
||||
# Import from sport modules
|
||||
from nba import scrape_nba_basketball_reference, NBA_TEAMS
|
||||
from mlb import scrape_mlb_statsapi, scrape_mlb_baseball_reference, MLB_TEAMS
|
||||
from nhl import scrape_nhl_hockey_reference, NHL_TEAMS
|
||||
from nfl import scrape_nfl_espn, NFL_TEAMS
|
||||
|
||||
# Import secondary sports from scrape_schedules (stubs)
|
||||
from scrape_schedules import (
|
||||
Game, Stadium,
|
||||
scrape_nba_basketball_reference,
|
||||
scrape_mlb_statsapi, scrape_mlb_baseball_reference,
|
||||
scrape_nhl_hockey_reference,
|
||||
scrape_wnba_espn, scrape_mls_espn, scrape_nwsl_espn,
|
||||
scrape_nfl_espn, scrape_cbb_espn,
|
||||
NBA_TEAMS, MLB_TEAMS, NHL_TEAMS, WNBA_TEAMS, MLS_TEAMS, NWSL_TEAMS,
|
||||
NFL_TEAMS,
|
||||
assign_stable_ids,
|
||||
scrape_wnba_espn, scrape_mls_espn, scrape_nwsl_espn, scrape_cbb_espn,
|
||||
WNBA_TEAMS, MLS_TEAMS, NWSL_TEAMS,
|
||||
)
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user