{ "cells": [ { "cell_type": "markdown", "id": "81215b75-f5f8-4c17-9cd4-08b1b0ed4234", "metadata": {}, "source": [ "# Goal Expectancy\n", "\n", "Estimates the goal expectancy (the number of goals the bookmaker expects each team to score) based on their home, draw, away probabilities" ] }, { "cell_type": "code", "execution_count": 1, "id": "1f931497-c1f9-4cb4-969a-058676e42a24", "metadata": { "tags": [] }, "outputs": [], "source": [ "import penaltyblog as pb\n", "import pandas as pd" ] }, { "cell_type": "markdown", "id": "4a1b5c76-8f47-4f59-8351-d5add2f69309", "metadata": {}, "source": [ "## Get data from football-data.co.uk" ] }, { "cell_type": "code", "execution_count": 2, "id": "949b129d-e4e5-4975-8318-dd601d918e90", "metadata": { "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
team_hometeam_awaypshpsdpsa
id
1565308800---liverpool---norwichLiverpoolNorwich1.159.5918.05
1565395200---bournemouth---sheffield_unitedBournemouthSheffield United2.043.573.90
1565395200---burnley---southamptonBurnleySouthampton2.713.312.81
1565395200---crystal_palace---evertonCrystal PalaceEverton3.213.372.39
1565395200---tottenham---aston_villaTottenhamAston Villa1.305.8410.96
\n", "
" ], "text/plain": [ " team_home team_away \\\n", "id \n", "1565308800---liverpool---norwich Liverpool Norwich \n", "1565395200---bournemouth---sheffield_united Bournemouth Sheffield United \n", "1565395200---burnley---southampton Burnley Southampton \n", "1565395200---crystal_palace---everton Crystal Palace Everton \n", "1565395200---tottenham---aston_villa Tottenham Aston Villa \n", "\n", " psh psd psa \n", "id \n", "1565308800---liverpool---norwich 1.15 9.59 18.05 \n", "1565395200---bournemouth---sheffield_united 2.04 3.57 3.90 \n", "1565395200---burnley---southampton 2.71 3.31 2.81 \n", "1565395200---crystal_palace---everton 3.21 3.37 2.39 \n", "1565395200---tottenham---aston_villa 1.30 5.84 10.96 " ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "fb = pb.scrapers.FootballData(\"ENG Premier League\", \"2019-2020\")\n", "df = fb.get_fixtures()\n", "\n", "cols = [\"team_home\", \"team_away\", \"psh\", \"psd\", \"psa\"]\n", "df = df[cols]\n", "\n", "df.head()" ] }, { "cell_type": "markdown", "id": "faf4dd3f-34ca-4547-bcac-46d45ae2e1f2", "metadata": {}, "source": [ "## Remove the overround from the odds" ] }, { "cell_type": "code", "execution_count": 3, "id": "57093b8f-9725-4740-9a93-35da39171380", "metadata": { "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
team_hometeam_awaypshpsdpsahomedrawaway
id
1565308800---liverpool---norwichLiverpoolNorwich1.159.5918.050.8598180.0945280.045654
1565395200---bournemouth---sheffield_unitedBournemouthSheffield United2.043.573.900.4812900.2712060.247504
1565395200---burnley---southamptonBurnleySouthampton2.713.312.810.3600070.2931180.346875
1565395200---crystal_palace---evertonCrystal PalaceEverton3.213.372.390.3026360.2878450.409519
1565395200---tottenham---aston_villaTottenhamAston Villa1.305.8410.960.7586630.1606650.080673
\n", "
" ], "text/plain": [ " team_home team_away \\\n", "id \n", "1565308800---liverpool---norwich Liverpool Norwich \n", "1565395200---bournemouth---sheffield_united Bournemouth Sheffield United \n", "1565395200---burnley---southampton Burnley Southampton \n", "1565395200---crystal_palace---everton Crystal Palace Everton \n", "1565395200---tottenham---aston_villa Tottenham Aston Villa \n", "\n", " psh psd psa home \\\n", "id \n", "1565308800---liverpool---norwich 1.15 9.59 18.05 0.859818 \n", "1565395200---bournemouth---sheffield_united 2.04 3.57 3.90 0.481290 \n", "1565395200---burnley---southampton 2.71 3.31 2.81 0.360007 \n", "1565395200---crystal_palace---everton 3.21 3.37 2.39 0.302636 \n", "1565395200---tottenham---aston_villa 1.30 5.84 10.96 0.758663 \n", "\n", " draw away \n", "id \n", "1565308800---liverpool---norwich 0.094528 0.045654 \n", "1565395200---bournemouth---sheffield_united 0.271206 0.247504 \n", "1565395200---burnley---southampton 0.293118 0.346875 \n", "1565395200---crystal_palace---everton 0.287845 0.409519 \n", "1565395200---tottenham---aston_villa 0.160665 0.080673 " ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "def remove_overround(row):\n", " odds = [\n", " row[\"psh\"],\n", " row[\"psd\"],\n", " row[\"psa\"],\n", " ]\n", "\n", " odds = pb.implied.differential_margin_weighting(odds)\n", "\n", " return pd.Series(odds[\"implied_probabilities\"])\n", "\n", "\n", "df[[\"home\", \"draw\", \"away\"]] = df.apply(remove_overround, axis=1)\n", "\n", "df.head()" ] }, { "cell_type": "markdown", "id": "9257f0fc-5f2b-402f-9209-d005d14880be", "metadata": {}, "source": [ "## Get the goal expectancy" ] }, { "cell_type": "code", "execution_count": 4, "id": "6b8b7d83-273e-4ab1-bac0-b7387556a03f", "metadata": { "tags": [] }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
team_hometeam_awayhome_expectancyaway_expectancysuccesserror
0LiverpoolNorwich3.2199330.667064True5.381587e-09
1BournemouthSheffield United1.4035880.923020True5.932409e-11
2BurnleySouthampton1.0998761.073906True1.595460e-11
3Crystal PalaceEverton0.9999681.213245True6.410602e-11
4TottenhamAston Villa2.3128560.607438True1.123882e-10
\n", "
" ], "text/plain": [ " team_home team_away home_expectancy away_expectancy \\\n", "0 Liverpool Norwich 3.219933 0.667064 \n", "1 Bournemouth Sheffield United 1.403588 0.923020 \n", "2 Burnley Southampton 1.099876 1.073906 \n", "3 Crystal Palace Everton 0.999968 1.213245 \n", "4 Tottenham Aston Villa 2.312856 0.607438 \n", "\n", " success error \n", "0 True 5.381587e-09 \n", "1 True 5.932409e-11 \n", "2 True 1.595460e-11 \n", "3 True 6.410602e-11 \n", "4 True 1.123882e-10 " ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "output = list()\n", "for idx, row in df.head().iterrows():\n", " res = pb.models.goal_expectancy(row[\"home\"], row[\"draw\"], row[\"away\"])\n", "\n", " tmp = {\n", " \"team_home\": row[\"team_home\"],\n", " \"team_away\": row[\"team_away\"],\n", " \"home_expectancy\": res[\"home_exp\"],\n", " \"away_expectancy\": res[\"away_exp\"],\n", " \"success\": res[\"success\"],\n", " \"error\": res[\"error\"],\n", " }\n", "\n", " output.append(tmp)\n", "\n", "output = pd.DataFrame(output)\n", "output" ] }, { "cell_type": "code", "execution_count": null, "id": "e5997054-9134-43e3-9d08-797c183fe642", "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "venv", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.13.1" } }, "nbformat": 4, "nbformat_minor": 5 }