{ "cells": [ { "cell_type": "markdown", "id": "fdfeabe5-ff98-444e-a107-de870427f5f5", "metadata": {}, "source": [ "# football-data.co.uk" ] }, { "cell_type": "code", "execution_count": 1, "id": "01177c79-baa8-4f27-a3f3-4c8e2737c563", "metadata": { "tags": [] }, "outputs": [], "source": [ "import sys\n", "\n", "sys.path.append(\"../../\")\n", "\n", "import penaltyblog as pb" ] }, { "cell_type": "markdown", "id": "d2787af4-680c-4fdf-835c-082602443172", "metadata": {}, "source": [ "### List the available countries to download data for" ] }, { "cell_type": "code", "execution_count": 2, "id": "6c0c661b-9ae2-4c41-a354-5f9ab6870f28", "metadata": { "tags": [] }, "outputs": [ { "data": { "text/plain": [ "['BEL First Division A',\n", " 'DEU Bundesliga 1',\n", " 'DEU Bundesliga 2',\n", " 'ENG Premier League',\n", " 'ENG Championship',\n", " 'ENG League 1',\n", " 'ENG League 2',\n", " 'ENG Conference',\n", " 'ESP La Liga',\n", " 'ESP La Liga Segunda',\n", " 'FRA Ligue 1',\n", " 'FRA Ligue 2',\n", " 'GRC Super League',\n", " 'ITA Serie A',\n", " 'ITA Serie B',\n", " 'NLD Eredivisie',\n", " 'PRT Liga 1',\n", " 'SCO Premier League',\n", " 'SCO Division 1',\n", " 'SCO Division 2',\n", " 'SCO Division 3',\n", " 'TUR Super Lig']" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pb.scrapers.FootballData.list_competitions()" ] }, { "cell_type": "markdown", "id": "9be833ab-9653-402c-8dd9-decaeffe39d1", "metadata": {}, "source": [ "### Download the data for the English Premier League" ] }, { "cell_type": "code", "execution_count": 3, "id": "dd11c0a6-3ed1-4131-9dbb-020c89ce066c", "metadata": { "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
datedatetimeseasoncompetitiondivtimeteam_hometeam_awayfthgftag...b365_cahhb365_cahapcahhpcahamax_cahhmax_cahaavg_cahhavg_cahagoals_homegoals_away
id
1628812800---brentford---arsenal2021-08-132021-08-13 20:00:002021-2022ENG Premier LeagueE020:00BrentfordArsenal20...1.752.051.812.132.052.171.802.0920
1628899200---burnley---brighton2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00BurnleyBrighton12...1.792.151.812.141.822.191.792.1212
1628899200---chelsea---crystal_palace2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00ChelseaCrystal Palace30...2.051.752.121.812.161.932.061.8230
1628899200---everton---southampton2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00EvertonSouthampton31...2.051.882.051.882.081.902.031.8631
1628899200---leicester---wolves2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00LeicesterWolves10...2.021.912.011.922.051.951.991.8910
\n", "

5 rows × 111 columns

\n", "
" ], "text/plain": [ " date datetime \\\n", "id \n", "1628812800---brentford---arsenal 2021-08-13 2021-08-13 20:00:00 \n", "1628899200---burnley---brighton 2021-08-14 2021-08-14 15:00:00 \n", "1628899200---chelsea---crystal_palace 2021-08-14 2021-08-14 15:00:00 \n", "1628899200---everton---southampton 2021-08-14 2021-08-14 15:00:00 \n", "1628899200---leicester---wolves 2021-08-14 2021-08-14 15:00:00 \n", "\n", " season competition div \\\n", "id \n", "1628812800---brentford---arsenal 2021-2022 ENG Premier League E0 \n", "1628899200---burnley---brighton 2021-2022 ENG Premier League E0 \n", "1628899200---chelsea---crystal_palace 2021-2022 ENG Premier League E0 \n", "1628899200---everton---southampton 2021-2022 ENG Premier League E0 \n", "1628899200---leicester---wolves 2021-2022 ENG Premier League E0 \n", "\n", " time team_home team_away fthg \\\n", "id \n", "1628812800---brentford---arsenal 20:00 Brentford Arsenal 2 \n", "1628899200---burnley---brighton 15:00 Burnley Brighton 1 \n", "1628899200---chelsea---crystal_palace 15:00 Chelsea Crystal Palace 3 \n", "1628899200---everton---southampton 15:00 Everton Southampton 3 \n", "1628899200---leicester---wolves 15:00 Leicester Wolves 1 \n", "\n", " ftag ... b365_cahh b365_caha pcahh \\\n", "id ... \n", "1628812800---brentford---arsenal 0 ... 1.75 2.05 1.81 \n", "1628899200---burnley---brighton 2 ... 1.79 2.15 1.81 \n", "1628899200---chelsea---crystal_palace 0 ... 2.05 1.75 2.12 \n", "1628899200---everton---southampton 1 ... 2.05 1.88 2.05 \n", "1628899200---leicester---wolves 0 ... 2.02 1.91 2.01 \n", "\n", " pcaha max_cahh max_caha avg_cahh \\\n", "id \n", "1628812800---brentford---arsenal 2.13 2.05 2.17 1.80 \n", "1628899200---burnley---brighton 2.14 1.82 2.19 1.79 \n", "1628899200---chelsea---crystal_palace 1.81 2.16 1.93 2.06 \n", "1628899200---everton---southampton 1.88 2.08 1.90 2.03 \n", "1628899200---leicester---wolves 1.92 2.05 1.95 1.99 \n", "\n", " avg_caha goals_home goals_away \n", "id \n", "1628812800---brentford---arsenal 2.09 2 0 \n", "1628899200---burnley---brighton 2.12 1 2 \n", "1628899200---chelsea---crystal_palace 1.82 3 0 \n", "1628899200---everton---southampton 1.86 3 1 \n", "1628899200---leicester---wolves 1.89 1 0 \n", "\n", "[5 rows x 111 columns]" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "fb = pb.scrapers.FootballData(\"ENG Premier League\", \"2021-2022\")\n", "df = fb.get_fixtures()\n", "\n", "df.head()" ] }, { "cell_type": "markdown", "id": "d1517234-e0c2-4718-aa84-2a9cacfaa81f", "metadata": {}, "source": [ "### Download the data for the English Premier League and map team names" ] }, { "cell_type": "code", "execution_count": 4, "id": "20190a0b-f01e-437d-ab3e-fc6ff701cceb", "metadata": { "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
datedatetimeseasoncompetitiondivtimeteam_hometeam_awayfthgftag...b365_cahhb365_cahapcahhpcahamax_cahhmax_cahaavg_cahhavg_cahagoals_homegoals_away
id
1628812800---brentford---arsenal2021-08-132021-08-13 20:00:002021-2022ENG Premier LeagueE020:00BrentfordArsenal20...1.752.051.812.132.052.171.802.0920
1628899200---burnley---brighton2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00BurnleyBrighton12...1.792.151.812.141.822.191.792.1212
1628899200---chelsea---crystal_palace2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00ChelseaCrystal Palace30...2.051.752.121.812.161.932.061.8230
1628899200---everton---southampton2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00EvertonSouthampton31...2.051.882.051.882.081.902.031.8631
1628899200---leicester_city---wolverhampton_wanderers2021-08-142021-08-14 15:00:002021-2022ENG Premier LeagueE015:00Leicester CityWolverhampton Wanderers10...2.021.912.011.922.051.951.991.8910
\n", "

5 rows × 111 columns

\n", "
" ], "text/plain": [ " date \\\n", "id \n", "1628812800---brentford---arsenal 2021-08-13 \n", "1628899200---burnley---brighton 2021-08-14 \n", "1628899200---chelsea---crystal_palace 2021-08-14 \n", "1628899200---everton---southampton 2021-08-14 \n", "1628899200---leicester_city---wolverhampton_wan... 2021-08-14 \n", "\n", " datetime \\\n", "id \n", "1628812800---brentford---arsenal 2021-08-13 20:00:00 \n", "1628899200---burnley---brighton 2021-08-14 15:00:00 \n", "1628899200---chelsea---crystal_palace 2021-08-14 15:00:00 \n", "1628899200---everton---southampton 2021-08-14 15:00:00 \n", "1628899200---leicester_city---wolverhampton_wan... 2021-08-14 15:00:00 \n", "\n", " season \\\n", "id \n", "1628812800---brentford---arsenal 2021-2022 \n", "1628899200---burnley---brighton 2021-2022 \n", "1628899200---chelsea---crystal_palace 2021-2022 \n", "1628899200---everton---southampton 2021-2022 \n", "1628899200---leicester_city---wolverhampton_wan... 2021-2022 \n", "\n", " competition div \\\n", "id \n", "1628812800---brentford---arsenal ENG Premier League E0 \n", "1628899200---burnley---brighton ENG Premier League E0 \n", "1628899200---chelsea---crystal_palace ENG Premier League E0 \n", "1628899200---everton---southampton ENG Premier League E0 \n", "1628899200---leicester_city---wolverhampton_wan... ENG Premier League E0 \n", "\n", " time team_home \\\n", "id \n", "1628812800---brentford---arsenal 20:00 Brentford \n", "1628899200---burnley---brighton 15:00 Burnley \n", "1628899200---chelsea---crystal_palace 15:00 Chelsea \n", "1628899200---everton---southampton 15:00 Everton \n", "1628899200---leicester_city---wolverhampton_wan... 15:00 Leicester City \n", "\n", " team_away \\\n", "id \n", "1628812800---brentford---arsenal Arsenal \n", "1628899200---burnley---brighton Brighton \n", "1628899200---chelsea---crystal_palace Crystal Palace \n", "1628899200---everton---southampton Southampton \n", "1628899200---leicester_city---wolverhampton_wan... Wolverhampton Wanderers \n", "\n", " fthg ftag ... b365_cahh \\\n", "id ... \n", "1628812800---brentford---arsenal 2 0 ... 1.75 \n", "1628899200---burnley---brighton 1 2 ... 1.79 \n", "1628899200---chelsea---crystal_palace 3 0 ... 2.05 \n", "1628899200---everton---southampton 3 1 ... 2.05 \n", "1628899200---leicester_city---wolverhampton_wan... 1 0 ... 2.02 \n", "\n", " b365_caha pcahh pcaha \\\n", "id \n", "1628812800---brentford---arsenal 2.05 1.81 2.13 \n", "1628899200---burnley---brighton 2.15 1.81 2.14 \n", "1628899200---chelsea---crystal_palace 1.75 2.12 1.81 \n", "1628899200---everton---southampton 1.88 2.05 1.88 \n", "1628899200---leicester_city---wolverhampton_wan... 1.91 2.01 1.92 \n", "\n", " max_cahh max_caha \\\n", "id \n", "1628812800---brentford---arsenal 2.05 2.17 \n", "1628899200---burnley---brighton 1.82 2.19 \n", "1628899200---chelsea---crystal_palace 2.16 1.93 \n", "1628899200---everton---southampton 2.08 1.90 \n", "1628899200---leicester_city---wolverhampton_wan... 2.05 1.95 \n", "\n", " avg_cahh avg_caha \\\n", "id \n", "1628812800---brentford---arsenal 1.80 2.09 \n", "1628899200---burnley---brighton 1.79 2.12 \n", "1628899200---chelsea---crystal_palace 2.06 1.82 \n", "1628899200---everton---southampton 2.03 1.86 \n", "1628899200---leicester_city---wolverhampton_wan... 1.99 1.89 \n", "\n", " goals_home goals_away \n", "id \n", "1628812800---brentford---arsenal 2 0 \n", "1628899200---burnley---brighton 1 2 \n", "1628899200---chelsea---crystal_palace 3 0 \n", "1628899200---everton---southampton 3 1 \n", "1628899200---leicester_city---wolverhampton_wan... 1 0 \n", "\n", "[5 rows x 111 columns]" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "team_mappings = pb.scrapers.get_example_team_name_mappings()\n", "\n", "fb = pb.scrapers.FootballData(\"ENG Premier League\", \"2021-2022\", team_mappings)\n", "df = fb.get_fixtures()\n", "\n", "df.head()" ] }, { "cell_type": "code", "execution_count": null, "id": "04e054d3-1c05-4c51-b175-efd574f7a4d9", "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.13.0" } }, "nbformat": 4, "nbformat_minor": 5 }