feat(scripts): add sportstime-parser data pipeline
Complete Python package for scraping, normalizing, and uploading sports schedule data to CloudKit. Includes: - Multi-source scrapers for NBA, MLB, NFL, NHL, MLS, WNBA, NWSL - Canonical ID system for teams, stadiums, and games - Fuzzy matching with manual alias support - CloudKit uploader with batch operations and deduplication - Comprehensive test suite with fixtures - WNBA abbreviation aliases for improved team resolution - Alias validation script to detect orphan references All 5 phases of data remediation plan completed: - Phase 1: Alias fixes (team/stadium alias additions) - Phase 2: NHL stadium coordinate fixes - Phase 3: Re-scrape validation - Phase 4: iOS bundle update - Phase 5: Code quality improvements (WNBA aliases) Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
46
sportstime_parser/scrapers/__init__.py
Normal file
46
sportstime_parser/scrapers/__init__.py
Normal file
@@ -0,0 +1,46 @@
|
||||
"""Scrapers for fetching sports data from various sources."""
|
||||
|
||||
from .base import (
|
||||
BaseScraper,
|
||||
RawGameData,
|
||||
ScrapeResult,
|
||||
ScraperError,
|
||||
PartialDataError,
|
||||
)
|
||||
from .nba import NBAScraper, create_nba_scraper
|
||||
from .mlb import MLBScraper, create_mlb_scraper
|
||||
from .nfl import NFLScraper, create_nfl_scraper
|
||||
from .nhl import NHLScraper, create_nhl_scraper
|
||||
from .mls import MLSScraper, create_mls_scraper
|
||||
from .wnba import WNBAScraper, create_wnba_scraper
|
||||
from .nwsl import NWSLScraper, create_nwsl_scraper
|
||||
|
||||
__all__ = [
|
||||
# Base
|
||||
"BaseScraper",
|
||||
"RawGameData",
|
||||
"ScrapeResult",
|
||||
"ScraperError",
|
||||
"PartialDataError",
|
||||
# NBA
|
||||
"NBAScraper",
|
||||
"create_nba_scraper",
|
||||
# MLB
|
||||
"MLBScraper",
|
||||
"create_mlb_scraper",
|
||||
# NFL
|
||||
"NFLScraper",
|
||||
"create_nfl_scraper",
|
||||
# NHL
|
||||
"NHLScraper",
|
||||
"create_nhl_scraper",
|
||||
# MLS
|
||||
"MLSScraper",
|
||||
"create_mls_scraper",
|
||||
# WNBA
|
||||
"WNBAScraper",
|
||||
"create_wnba_scraper",
|
||||
# NWSL
|
||||
"NWSLScraper",
|
||||
"create_nwsl_scraper",
|
||||
]
|
||||
Reference in New Issue
Block a user