FOOTBALLDATALAKEHOUSE/
│
├── analytics/
│ └── sql_queries.sql
│ # Final business-grade SQL queries
│ # Used to generate KPIs, insights, and CSV exports
│
├── dashboards/
│ ├── Football Analytics.pbix
│ │ # Main Power BI dashboard file
│ │ # Interactive executive-level football analytics
│ │
│ └── Football Leagues Dashboard.png
│ # Snapshot of the Power BI dashboard
│ # Used for README previews and portfolio showcases
│
├── data_model/
│ ├── Model Relations.png
│ │ # Visual representation of fact & dimension relationships
│ │ # Shows star-schema style modeling
│ │
│ └── bi model
│ # Power BI semantic / data model configuration
│ # Measures, relationships, and calculated fields
│
├── data/
│ ├── bronze/
│ │ └── matches/
│ │ # Raw JSON match data ingested directly from the Football API
│ │ # Stored without transformation for full traceability
│ │
│ ├── silver/
│ │ └── matches/
│ │ └── matches_clean.parquet
│ │ # Cleaned and standardized match-level dataset
│ │ # Ready for analytical modeling
│ │
│ ├── gold/
│ │ ├── fact_matches.parquet
│ │ │ # Match-level fact table
│ │ │ # Grain: one row per match
│ │ │
│ │ ├── league_kpis.parquet
│ │ │ # KPIs aggregated by competition and season
│ │ │
│ │ └── team_performance.parquet
│ │ # Team-level performance metrics
│ │ # (goals scored, goals conceded, goal difference, dominance)
│ │
│ └── exports/
│ # Business-ready KPI outputs generated from SQL
│ ├── kpi_score_intensity.csv
│ ├── kpi_home_advantage.csv
│ ├── kpi_top_teams.csv
│ ├── kpi_competitiveness_gap.csv
│ └── kpi_scoring_volatility.csv
│
├── ingestion/
│ └── fetch_matches.py
│ # API ingestion script
│ # Fetches match data by competition and season
│
├── transformation/
│ ├── clean_matches.py
│ │ # Transforms raw JSON into the standardized Silver layer
│ │
│ └── build_gold.py
│ # Builds Gold-layer fact tables and business KPIs
│
├── notebooks/
│ └── validate_gold.py
│ # Data validation and quality checks
│
├── visuals/
│ # Executive-level visual outputs used in README and presentations
│ ├── score_intensity.png
│ ├── home_advantage.png
│ ├── top_teams.png
│ ├── competitiveness_gap.png
│ └── scoring_volatility.png
│
├── README.md
│ # Business-focused case study documentation
│
├── LICENSE
│ # MIT License
│
└── requirements.txt
# Python dependencies for reproducibility