From 1180cf86cc40708981df3deebe017e873dc87e2f Mon Sep 17 00:00:00 2001
From: aditya desle <50102208+adityadesle@users.noreply.github.com>
Date: Fri, 2 Oct 2020 20:35:46 +0530
Subject: [PATCH 1/2] Update README.md
---
README.md | 1 +
1 file changed, 1 insertion(+)
diff --git a/README.md b/README.md
index fc61313..c34dbdc 100644
--- a/README.md
+++ b/README.md
@@ -16,6 +16,7 @@ Course topics include:
* Fundamentals of Python and its data types
* Data analysis packages Numpy and Pandas
* Plotting packages Matplotlib and Seaborn
+* Example of data analysis: Uber raw data analysis report
* Statistics
* Regular expressions
* Interactive visualization
From d0dde4910a169aa31f1e7f37e259ba1d412930b0 Mon Sep 17 00:00:00 2001
From: aditya desle <50102208+adityadesle@users.noreply.github.com>
Date: Fri, 2 Oct 2020 20:36:12 +0530
Subject: [PATCH 2/2] Add Uber_data.ipynb (Uber April 2014 raw data analysis notebook)
---
Uber_data.ipynb | 1829 +++++++++++++++++++++++++++++++++++++++++++++++
1 file changed, 1829 insertions(+)
create mode 100644 Uber_data.ipynb
diff --git a/Uber_data.ipynb b/Uber_data.ipynb
new file mode 100644
index 0000000..4976042
--- /dev/null
+++ b/Uber_data.ipynb
@@ -0,0 +1,1829 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Populating the interactive namespace from numpy and matplotlib\n"
+ ]
+ }
+ ],
+ "source": [
+ "%pylab inline\n",
+ "import pandas as pd\n",
+ "import seaborn as sb"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "\n",
+ "data = pd.read_csv('uber-raw-data-apr14.csv')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "<div>\n",
+ "\n",
+ "<table border=\"1\" class=\"dataframe\">\n",
+ "  <thead>\n",
+ "    <tr style=\"text-align: right;\">\n",
+ "      <th></th>\n",
+ "      <th>Date/Time</th>\n",
+ "      <th>Lat</th>\n",
+ "      <th>Lon</th>\n",
+ "      <th>Base</th>\n",
+ "    </tr>\n",
+ "  </thead>\n",
+ "  <tbody>\n",
+ "    <tr>\n",
+ "      <th>0</th>\n",
+ "      <td>4/1/2014 0:11:00</td>\n",
+ "      <td>40.7690</td>\n",
+ "      <td>-73.9549</td>\n",
+ "      <td>B02512</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>1</th>\n",
+ "      <td>4/1/2014 0:17:00</td>\n",
+ "      <td>40.7267</td>\n",
+ "      <td>-74.0345</td>\n",
+ "      <td>B02512</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>2</th>\n",
+ "      <td>4/1/2014 0:21:00</td>\n",
+ "      <td>40.7316</td>\n",
+ "      <td>-73.9873</td>\n",
+ "      <td>B02512</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>3</th>\n",
+ "      <td>4/1/2014 0:28:00</td>\n",
+ "      <td>40.7588</td>\n",
+ "      <td>-73.9776</td>\n",
+ "      <td>B02512</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>4</th>\n",
+ "      <td>4/1/2014 0:33:00</td>\n",
+ "      <td>40.7594</td>\n",
+ "      <td>-73.9722</td>\n",
+ "      <td>B02512</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>...</th>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564511</th>\n",
+ "      <td>4/30/2014 23:22:00</td>\n",
+ "      <td>40.7640</td>\n",
+ "      <td>-73.9744</td>\n",
+ "      <td>B02764</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564512</th>\n",
+ "      <td>4/30/2014 23:26:00</td>\n",
+ "      <td>40.7629</td>\n",
+ "      <td>-73.9672</td>\n",
+ "      <td>B02764</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564513</th>\n",
+ "      <td>4/30/2014 23:31:00</td>\n",
+ "      <td>40.7443</td>\n",
+ "      <td>-73.9889</td>\n",
+ "      <td>B02764</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564514</th>\n",
+ "      <td>4/30/2014 23:32:00</td>\n",
+ "      <td>40.6756</td>\n",
+ "      <td>-73.9405</td>\n",
+ "      <td>B02764</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564515</th>\n",
+ "      <td>4/30/2014 23:48:00</td>\n",
+ "      <td>40.6880</td>\n",
+ "      <td>-73.9608</td>\n",
+ "      <td>B02764</td>\n",
+ "    </tr>\n",
+ "  </tbody>\n",
+ "</table>\n",
+ "<p>564516 rows × 4 columns</p>\n",
+ "</div>"
+ ],
+ "text/plain": [
+ " Date/Time Lat Lon Base\n",
+ "0 4/1/2014 0:11:00 40.7690 -73.9549 B02512\n",
+ "1 4/1/2014 0:17:00 40.7267 -74.0345 B02512\n",
+ "2 4/1/2014 0:21:00 40.7316 -73.9873 B02512\n",
+ "3 4/1/2014 0:28:00 40.7588 -73.9776 B02512\n",
+ "4 4/1/2014 0:33:00 40.7594 -73.9722 B02512\n",
+ "... ... ... ... ...\n",
+ "564511 4/30/2014 23:22:00 40.7640 -73.9744 B02764\n",
+ "564512 4/30/2014 23:26:00 40.7629 -73.9672 B02764\n",
+ "564513 4/30/2014 23:31:00 40.7443 -73.9889 B02764\n",
+ "564514 4/30/2014 23:32:00 40.6756 -73.9405 B02764\n",
+ "564515 4/30/2014 23:48:00 40.6880 -73.9608 B02764\n",
+ "\n",
+ "[564516 rows x 4 columns]"
+ ]
+ },
+ "execution_count": 3,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(564516, 4)"
+ ]
+ },
+ "execution_count": 4,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data.shape"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "\n",
+ "data['Date/Time'] = pd.to_datetime(data['Date/Time'])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'Tuesday'"
+ ]
+ },
+ "execution_count": 6,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data['Date/Time'][0].day_name()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "0 Tuesday\n",
+ "1 Tuesday\n",
+ "2 Tuesday\n",
+ "3 Tuesday\n",
+ "4 Tuesday\n",
+ " ... \n",
+ "564511 Wednesday\n",
+ "564512 Wednesday\n",
+ "564513 Wednesday\n",
+ "564514 Wednesday\n",
+ "564515 Wednesday\n",
+ "Name: Date/Time, Length: 564516, dtype: object"
+ ]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data['Date/Time'].dt.day_name()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "data['Daysofweek'] = data['Date/Time'].dt.day_name()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "<div>\n",
+ "\n",
+ "<table border=\"1\" class=\"dataframe\">\n",
+ "  <thead>\n",
+ "    <tr style=\"text-align: right;\">\n",
+ "      <th></th>\n",
+ "      <th>Date/Time</th>\n",
+ "      <th>Lat</th>\n",
+ "      <th>Lon</th>\n",
+ "      <th>Base</th>\n",
+ "      <th>Daysofweek</th>\n",
+ "    </tr>\n",
+ "  </thead>\n",
+ "  <tbody>\n",
+ "    <tr>\n",
+ "      <th>0</th>\n",
+ "      <td>2014-04-01 00:11:00</td>\n",
+ "      <td>40.7690</td>\n",
+ "      <td>-73.9549</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>1</th>\n",
+ "      <td>2014-04-01 00:17:00</td>\n",
+ "      <td>40.7267</td>\n",
+ "      <td>-74.0345</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>2</th>\n",
+ "      <td>2014-04-01 00:21:00</td>\n",
+ "      <td>40.7316</td>\n",
+ "      <td>-73.9873</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>3</th>\n",
+ "      <td>2014-04-01 00:28:00</td>\n",
+ "      <td>40.7588</td>\n",
+ "      <td>-73.9776</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>4</th>\n",
+ "      <td>2014-04-01 00:33:00</td>\n",
+ "      <td>40.7594</td>\n",
+ "      <td>-73.9722</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>...</th>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564511</th>\n",
+ "      <td>2014-04-30 23:22:00</td>\n",
+ "      <td>40.7640</td>\n",
+ "      <td>-73.9744</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564512</th>\n",
+ "      <td>2014-04-30 23:26:00</td>\n",
+ "      <td>40.7629</td>\n",
+ "      <td>-73.9672</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564513</th>\n",
+ "      <td>2014-04-30 23:31:00</td>\n",
+ "      <td>40.7443</td>\n",
+ "      <td>-73.9889</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564514</th>\n",
+ "      <td>2014-04-30 23:32:00</td>\n",
+ "      <td>40.6756</td>\n",
+ "      <td>-73.9405</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564515</th>\n",
+ "      <td>2014-04-30 23:48:00</td>\n",
+ "      <td>40.6880</td>\n",
+ "      <td>-73.9608</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "  </tbody>\n",
+ "</table>\n",
+ "<p>564516 rows × 5 columns</p>\n",
+ "</div>"
+ ],
+ "text/plain": [
+ " Date/Time Lat Lon Base Daysofweek\n",
+ "0 2014-04-01 00:11:00 40.7690 -73.9549 B02512 Tuesday\n",
+ "1 2014-04-01 00:17:00 40.7267 -74.0345 B02512 Tuesday\n",
+ "2 2014-04-01 00:21:00 40.7316 -73.9873 B02512 Tuesday\n",
+ "3 2014-04-01 00:28:00 40.7588 -73.9776 B02512 Tuesday\n",
+ "4 2014-04-01 00:33:00 40.7594 -73.9722 B02512 Tuesday\n",
+ "... ... ... ... ... ...\n",
+ "564511 2014-04-30 23:22:00 40.7640 -73.9744 B02764 Wednesday\n",
+ "564512 2014-04-30 23:26:00 40.7629 -73.9672 B02764 Wednesday\n",
+ "564513 2014-04-30 23:31:00 40.7443 -73.9889 B02764 Wednesday\n",
+ "564514 2014-04-30 23:32:00 40.6756 -73.9405 B02764 Wednesday\n",
+ "564515 2014-04-30 23:48:00 40.6880 -73.9608 B02764 Wednesday\n",
+ "\n",
+ "[564516 rows x 5 columns]"
+ ]
+ },
+ "execution_count": 9,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "14"
+ ]
+ },
+ "execution_count": 10,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data['Date/Time'][0].week"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "0 2014-04-01 00:11:00\n",
+ "1 2014-04-01 00:17:00\n",
+ "2 2014-04-01 00:21:00\n",
+ "3 2014-04-01 00:28:00\n",
+ "4 2014-04-01 00:33:00\n",
+ " ... \n",
+ "564511 2014-04-30 23:22:00\n",
+ "564512 2014-04-30 23:26:00\n",
+ "564513 2014-04-30 23:31:00\n",
+ "564514 2014-04-30 23:32:00\n",
+ "564515 2014-04-30 23:48:00\n",
+ "Name: Date/Time, Length: 564516, dtype: datetime64[ns]"
+ ]
+ },
+ "execution_count": 11,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data['Date/Time']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "<div>\n",
+ "\n",
+ "<table border=\"1\" class=\"dataframe\">\n",
+ "  <thead>\n",
+ "    <tr style=\"text-align: right;\">\n",
+ "      <th></th>\n",
+ "      <th>Date/Time</th>\n",
+ "      <th>Lat</th>\n",
+ "      <th>Lon</th>\n",
+ "      <th>Base</th>\n",
+ "      <th>Daysofweek</th>\n",
+ "    </tr>\n",
+ "  </thead>\n",
+ "  <tbody>\n",
+ "    <tr>\n",
+ "      <th>564511</th>\n",
+ "      <td>2014-04-30 23:22:00</td>\n",
+ "      <td>40.7640</td>\n",
+ "      <td>-73.9744</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564512</th>\n",
+ "      <td>2014-04-30 23:26:00</td>\n",
+ "      <td>40.7629</td>\n",
+ "      <td>-73.9672</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564513</th>\n",
+ "      <td>2014-04-30 23:31:00</td>\n",
+ "      <td>40.7443</td>\n",
+ "      <td>-73.9889</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564514</th>\n",
+ "      <td>2014-04-30 23:32:00</td>\n",
+ "      <td>40.6756</td>\n",
+ "      <td>-73.9405</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564515</th>\n",
+ "      <td>2014-04-30 23:48:00</td>\n",
+ "      <td>40.6880</td>\n",
+ "      <td>-73.9608</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "    </tr>\n",
+ "  </tbody>\n",
+ "</table>\n",
+ "</div>"
+ ],
+ "text/plain": [
+ " Date/Time Lat Lon Base Daysofweek\n",
+ "564511 2014-04-30 23:22:00 40.7640 -73.9744 B02764 Wednesday\n",
+ "564512 2014-04-30 23:26:00 40.7629 -73.9672 B02764 Wednesday\n",
+ "564513 2014-04-30 23:31:00 40.7443 -73.9889 B02764 Wednesday\n",
+ "564514 2014-04-30 23:32:00 40.6756 -73.9405 B02764 Wednesday\n",
+ "564515 2014-04-30 23:48:00 40.6880 -73.9608 B02764 Wednesday"
+ ]
+ },
+ "execution_count": 12,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data.tail()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 29,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def get_day(dt):\n",
+ " return dt.day\n",
+ "\n",
+ "data[\"DoM\"] = data['Date/Time'].map(get_day)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 50,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def get_hour(dt):\n",
+ " return dt.hour\n",
+ "\n",
+ "data['Hour'] = data['Date/Time'].map(get_hour)\n",
+ "\n",
+ "def get_week(dt):\n",
+ " return dt.weekday()\n",
+ "\n",
+ "data['Weekday'] = data['Date/Time'].map(get_week)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 51,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "<div>\n",
+ "\n",
+ "<table border=\"1\" class=\"dataframe\">\n",
+ "  <thead>\n",
+ "    <tr style=\"text-align: right;\">\n",
+ "      <th></th>\n",
+ "      <th>Date/Time</th>\n",
+ "      <th>Lat</th>\n",
+ "      <th>Lon</th>\n",
+ "      <th>Base</th>\n",
+ "      <th>Daysofweek</th>\n",
+ "      <th>DoM</th>\n",
+ "      <th>Hour</th>\n",
+ "      <th>Week</th>\n",
+ "      <th>Weekday</th>\n",
+ "    </tr>\n",
+ "  </thead>\n",
+ "  <tbody>\n",
+ "    <tr>\n",
+ "      <th>0</th>\n",
+ "      <td>2014-04-01 00:11:00</td>\n",
+ "      <td>40.7690</td>\n",
+ "      <td>-73.9549</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "      <td>1</td>\n",
+ "      <td>0</td>\n",
+ "      <td>14</td>\n",
+ "      <td>1</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>1</th>\n",
+ "      <td>2014-04-01 00:17:00</td>\n",
+ "      <td>40.7267</td>\n",
+ "      <td>-74.0345</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "      <td>1</td>\n",
+ "      <td>0</td>\n",
+ "      <td>14</td>\n",
+ "      <td>1</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>2</th>\n",
+ "      <td>2014-04-01 00:21:00</td>\n",
+ "      <td>40.7316</td>\n",
+ "      <td>-73.9873</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "      <td>1</td>\n",
+ "      <td>0</td>\n",
+ "      <td>14</td>\n",
+ "      <td>1</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>3</th>\n",
+ "      <td>2014-04-01 00:28:00</td>\n",
+ "      <td>40.7588</td>\n",
+ "      <td>-73.9776</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "      <td>1</td>\n",
+ "      <td>0</td>\n",
+ "      <td>14</td>\n",
+ "      <td>1</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>4</th>\n",
+ "      <td>2014-04-01 00:33:00</td>\n",
+ "      <td>40.7594</td>\n",
+ "      <td>-73.9722</td>\n",
+ "      <td>B02512</td>\n",
+ "      <td>Tuesday</td>\n",
+ "      <td>1</td>\n",
+ "      <td>0</td>\n",
+ "      <td>14</td>\n",
+ "      <td>1</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>...</th>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564511</th>\n",
+ "      <td>2014-04-30 23:22:00</td>\n",
+ "      <td>40.7640</td>\n",
+ "      <td>-73.9744</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "      <td>30</td>\n",
+ "      <td>23</td>\n",
+ "      <td>18</td>\n",
+ "      <td>2</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564512</th>\n",
+ "      <td>2014-04-30 23:26:00</td>\n",
+ "      <td>40.7629</td>\n",
+ "      <td>-73.9672</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "      <td>30</td>\n",
+ "      <td>23</td>\n",
+ "      <td>18</td>\n",
+ "      <td>2</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564513</th>\n",
+ "      <td>2014-04-30 23:31:00</td>\n",
+ "      <td>40.7443</td>\n",
+ "      <td>-73.9889</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "      <td>30</td>\n",
+ "      <td>23</td>\n",
+ "      <td>18</td>\n",
+ "      <td>2</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564514</th>\n",
+ "      <td>2014-04-30 23:32:00</td>\n",
+ "      <td>40.6756</td>\n",
+ "      <td>-73.9405</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "      <td>30</td>\n",
+ "      <td>23</td>\n",
+ "      <td>18</td>\n",
+ "      <td>2</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>564515</th>\n",
+ "      <td>2014-04-30 23:48:00</td>\n",
+ "      <td>40.6880</td>\n",
+ "      <td>-73.9608</td>\n",
+ "      <td>B02764</td>\n",
+ "      <td>Wednesday</td>\n",
+ "      <td>30</td>\n",
+ "      <td>23</td>\n",
+ "      <td>18</td>\n",
+ "      <td>2</td>\n",
+ "    </tr>\n",
+ "  </tbody>\n",
+ "</table>\n",
+ "<p>564516 rows × 9 columns</p>\n",
+ "</div>"
+ ],
+ "text/plain": [
+ " Date/Time Lat Lon Base Daysofweek DoM Hour \\\n",
+ "0 2014-04-01 00:11:00 40.7690 -73.9549 B02512 Tuesday 1 0 \n",
+ "1 2014-04-01 00:17:00 40.7267 -74.0345 B02512 Tuesday 1 0 \n",
+ "2 2014-04-01 00:21:00 40.7316 -73.9873 B02512 Tuesday 1 0 \n",
+ "3 2014-04-01 00:28:00 40.7588 -73.9776 B02512 Tuesday 1 0 \n",
+ "4 2014-04-01 00:33:00 40.7594 -73.9722 B02512 Tuesday 1 0 \n",
+ "... ... ... ... ... ... ... ... \n",
+ "564511 2014-04-30 23:22:00 40.7640 -73.9744 B02764 Wednesday 30 23 \n",
+ "564512 2014-04-30 23:26:00 40.7629 -73.9672 B02764 Wednesday 30 23 \n",
+ "564513 2014-04-30 23:31:00 40.7443 -73.9889 B02764 Wednesday 30 23 \n",
+ "564514 2014-04-30 23:32:00 40.6756 -73.9405 B02764 Wednesday 30 23 \n",
+ "564515 2014-04-30 23:48:00 40.6880 -73.9608 B02764 Wednesday 30 23 \n",
+ "\n",
+ " Week Weekday \n",
+ "0 14 1 \n",
+ "1 14 1 \n",
+ "2 14 1 \n",
+ "3 14 1 \n",
+ "4 14 1 \n",
+ "... ... ... \n",
+ "564511 18 2 \n",
+ "564512 18 2 \n",
+ "564513 18 2 \n",
+ "564514 18 2 \n",
+ "564515 18 2 \n",
+ "\n",
+ "[564516 rows x 9 columns]"
+ ]
+ },
+ "execution_count": 51,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Text(0.5, 1.0, 'Frequency of Uber - Apr - 2014')"
+ ]
+ },
+ "execution_count": 21,
+ "metadata": {},
+ "output_type": "execute_result"
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "hist(data.DoM , bins = 30 , rwidth = 0.8)\n",
+ "xlabel('Date of the month')\n",
+ "ylabel('frequency')\n",
+ "title('Frequency of Uber - Apr - 2014')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[]"
+ ]
+ },
+ "execution_count": 18,
+ "metadata": {},
+ "output_type": "execute_result"
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "plot(data.DoM)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "(1, 14546)\n",
+ "(2, 17474)\n",
+ "(3, 20701)\n",
+ "(4, 26714)\n",
+ "(5, 19521)\n",
+ "(6, 13445)\n",
+ "(7, 19550)\n",
+ "(8, 16188)\n",
+ "(9, 16843)\n",
+ "(10, 20041)\n",
+ "(11, 20420)\n",
+ "(12, 18170)\n",
+ "(13, 12112)\n",
+ "(14, 12674)\n",
+ "(15, 20641)\n",
+ "(16, 17717)\n",
+ "(17, 20973)\n",
+ "(18, 18074)\n",
+ "(19, 14602)\n",
+ "(20, 11017)\n",
+ "(21, 13162)\n",
+ "(22, 16975)\n",
+ "(23, 20346)\n",
+ "(24, 23352)\n",
+ "(25, 25095)\n",
+ "(26, 24925)\n",
+ "(27, 14677)\n",
+ "(28, 15475)\n",
+ "(29, 22835)\n",
+ "(30, 36251)\n"
+ ]
+ }
+ ],
+ "source": [
+ "for k , row in data.groupby('DoM'):\n",
+ " print ((k,len(row)))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 25,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "DoM\n",
+ "1 14546\n",
+ "2 17474\n",
+ "3 20701\n",
+ "4 26714\n",
+ "5 19521\n",
+ "6 13445\n",
+ "7 19550\n",
+ "8 16188\n",
+ "9 16843\n",
+ "10 20041\n",
+ "11 20420\n",
+ "12 18170\n",
+ "13 12112\n",
+ "14 12674\n",
+ "15 20641\n",
+ "16 17717\n",
+ "17 20973\n",
+ "18 18074\n",
+ "19 14602\n",
+ "20 11017\n",
+ "21 13162\n",
+ "22 16975\n",
+ "23 20346\n",
+ "24 23352\n",
+ "25 25095\n",
+ "26 24925\n",
+ "27 14677\n",
+ "28 15475\n",
+ "29 22835\n",
+ "30 36251\n",
+ "dtype: int64"
+ ]
+ },
+ "execution_count": 25,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "def count(row):\n",
+ " return(len(row))\n",
+ "\n",
+ "by_date = data.groupby('DoM').apply(count)\n",
+ "by_date"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 26,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[]"
+ ]
+ },
+ "execution_count": 26,
+ "metadata": {},
+ "output_type": "execute_result"
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "plot(by_date)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 40,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Hour Week\n",
+ "0 14 3030\n",
+ " 15 2665\n",
+ " 16 2316\n",
+ " 17 3343\n",
+ " 18 556\n",
+ " ... \n",
+ "23 14 4753\n",
+ " 15 4273\n",
+ " 16 4195\n",
+ " 17 5772\n",
+ " 18 1656\n",
+ "Length: 120, dtype: int64"
+ ]
+ },
+ "execution_count": 40,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ " data.groupby('Hour Week'.split()).apply(count)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 53,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "<div>\n",
+ "\n",
+ "<table border=\"1\" class=\"dataframe\">\n",
+ "  <thead>\n",
+ "    <tr style=\"text-align: right;\">\n",
+ "      <th>Weekday</th>\n",
+ "      <th>0</th>\n",
+ "      <th>1</th>\n",
+ "      <th>2</th>\n",
+ "      <th>3</th>\n",
+ "      <th>4</th>\n",
+ "      <th>5</th>\n",
+ "      <th>6</th>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>Hour</th>\n",
+ "      <th></th>\n",
+ "      <th></th>\n",
+ "      <th></th>\n",
+ "      <th></th>\n",
+ "      <th></th>\n",
+ "      <th></th>\n",
+ "      <th></th>\n",
+ "    </tr>\n",
+ "  </thead>\n",
+ "  <tbody>\n",
+ "    <tr>\n",
+ "      <th>0</th>\n",
+ "      <td>518</td>\n",
+ "      <td>765</td>\n",
+ "      <td>899</td>\n",
+ "      <td>792</td>\n",
+ "      <td>1367</td>\n",
+ "      <td>3027</td>\n",
+ "      <td>4542</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>1</th>\n",
+ "      <td>261</td>\n",
+ "      <td>367</td>\n",
+ "      <td>507</td>\n",
+ "      <td>459</td>\n",
+ "      <td>760</td>\n",
+ "      <td>2479</td>\n",
+ "      <td>2936</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>2</th>\n",
+ "      <td>238</td>\n",
+ "      <td>304</td>\n",
+ "      <td>371</td>\n",
+ "      <td>342</td>\n",
+ "      <td>513</td>\n",
+ "      <td>1577</td>\n",
+ "      <td>1590</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>3</th>\n",
+ "      <td>571</td>\n",
+ "      <td>516</td>\n",
+ "      <td>585</td>\n",
+ "      <td>567</td>\n",
+ "      <td>736</td>\n",
+ "      <td>1013</td>\n",
+ "      <td>1052</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>4</th>\n",
+ "      <td>1021</td>\n",
+ "      <td>887</td>\n",
+ "      <td>1003</td>\n",
+ "      <td>861</td>\n",
+ "      <td>932</td>\n",
+ "      <td>706</td>\n",
+ "      <td>685</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>5</th>\n",
+ "      <td>1619</td>\n",
+ "      <td>1734</td>\n",
+ "      <td>1990</td>\n",
+ "      <td>1454</td>\n",
+ "      <td>1382</td>\n",
+ "      <td>704</td>\n",
+ "      <td>593</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>6</th>\n",
+ "      <td>2974</td>\n",
+ "      <td>3766</td>\n",
+ "      <td>4230</td>\n",
+ "      <td>3179</td>\n",
+ "      <td>2836</td>\n",
+ "      <td>844</td>\n",
+ "      <td>669</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>7</th>\n",
+ "      <td>3888</td>\n",
+ "      <td>5304</td>\n",
+ "      <td>5647</td>\n",
+ "      <td>4159</td>\n",
+ "      <td>3943</td>\n",
+ "      <td>1110</td>\n",
+ "      <td>873</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>8</th>\n",
+ "      <td>3138</td>\n",
+ "      <td>4594</td>\n",
+ "      <td>5242</td>\n",
+ "      <td>3616</td>\n",
+ "      <td>3648</td>\n",
+ "      <td>1372</td>\n",
+ "      <td>1233</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>9</th>\n",
+ "      <td>2211</td>\n",
+ "      <td>2962</td>\n",
+ "      <td>3846</td>\n",
+ "      <td>2654</td>\n",
+ "      <td>2732</td>\n",
+ "      <td>1764</td>\n",
+ "      <td>1770</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>10</th>\n",
+ "      <td>1953</td>\n",
+ "      <td>2900</td>\n",
+ "      <td>3844</td>\n",
+ "      <td>2370</td>\n",
+ "      <td>2599</td>\n",
+ "      <td>2086</td>\n",
+ "      <td>2113</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>11</th>\n",
+ "      <td>1929</td>\n",
+ "      <td>2949</td>\n",
+ "      <td>3889</td>\n",
+ "      <td>2516</td>\n",
+ "      <td>2816</td>\n",
+ "      <td>2315</td>\n",
+ "      <td>2360</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>12</th>\n",
+ "      <td>1945</td>\n",
+ "      <td>2819</td>\n",
+ "      <td>3988</td>\n",
+ "      <td>2657</td>\n",
+ "      <td>2978</td>\n",
+ "      <td>2560</td>\n",
+ "      <td>2478</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>13</th>\n",
+ "      <td>2294</td>\n",
+ "      <td>3556</td>\n",
+ "      <td>4469</td>\n",
+ "      <td>3301</td>\n",
+ "      <td>3535</td>\n",
+ "      <td>2685</td>\n",
+ "      <td>2763</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>14</th>\n",
+ "      <td>3117</td>\n",
+ "      <td>4489</td>\n",
+ "      <td>5438</td>\n",
+ "      <td>4083</td>\n",
+ "      <td>4087</td>\n",
+ "      <td>3042</td>\n",
+ "      <td>2934</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>15</th>\n",
+ "      <td>3818</td>\n",
+ "      <td>6042</td>\n",
+ "      <td>7071</td>\n",
+ "      <td>5182</td>\n",
+ "      <td>5354</td>\n",
+ "      <td>4457</td>\n",
+ "      <td>3400</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>16</th>\n",
+ "      <td>4962</td>\n",
+ "      <td>7521</td>\n",
+ "      <td>8213</td>\n",
+ "      <td>6149</td>\n",
+ "      <td>6259</td>\n",
+ "      <td>5410</td>\n",
+ "      <td>3489</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>17</th>\n",
+ "      <td>5574</td>\n",
+ "      <td>8297</td>\n",
+ "      <td>9151</td>\n",
+ "      <td>6951</td>\n",
+ "      <td>6790</td>\n",
+ "      <td>5558</td>\n",
+ "      <td>3154</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>18</th>\n",
+ "      <td>4725</td>\n",
+ "      <td>7089</td>\n",
+ "      <td>8334</td>\n",
+ "      <td>6637</td>\n",
+ "      <td>7258</td>\n",
+ "      <td>6165</td>\n",
+ "      <td>2795</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>19</th>\n",
+ "      <td>4386</td>\n",
+ "      <td>6459</td>\n",
+ "      <td>7794</td>\n",
+ "      <td>5929</td>\n",
+ "      <td>6247</td>\n",
+ "      <td>5529</td>\n",
+ "      <td>2579</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>20</th>\n",
+ "      <td>3573</td>\n",
+ "      <td>6310</td>\n",
+ "      <td>7783</td>\n",
+ "      <td>6345</td>\n",
+ "      <td>5165</td>\n",
+ "      <td>4792</td>\n",
+ "      <td>2276</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>21</th>\n",
+ "      <td>3079</td>\n",
+ "      <td>5993</td>\n",
+ "      <td>6921</td>\n",
+ "      <td>6585</td>\n",
+ "      <td>6265</td>\n",
+ "      <td>5811</td>\n",
+ "      <td>2310</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>22</th>\n",
+ "      <td>1976</td>\n",
+ "      <td>3614</td>\n",
+ "      <td>4845</td>\n",
+ "      <td>5370</td>\n",
+ "      <td>6708</td>\n",
+ "      <td>6493</td>\n",
+ "      <td>1639</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>23</th>\n",
+ "      <td>1091</td>\n",
+ "      <td>1948</td>\n",
+ "      <td>2571</td>\n",
+ "      <td>2909</td>\n",
+ "      <td>5393</td>\n",
+ "      <td>5719</td>\n",
+ "      <td>1018</td>\n",
+ "    </tr>\n",
+ "  </tbody>\n",
+ "</table>\n",
+ "</div>"
+ ],
+ "text/plain": [
+ "Weekday 0 1 2 3 4 5 6\n",
+ "Hour \n",
+ "0 518 765 899 792 1367 3027 4542\n",
+ "1 261 367 507 459 760 2479 2936\n",
+ "2 238 304 371 342 513 1577 1590\n",
+ "3 571 516 585 567 736 1013 1052\n",
+ "4 1021 887 1003 861 932 706 685\n",
+ "5 1619 1734 1990 1454 1382 704 593\n",
+ "6 2974 3766 4230 3179 2836 844 669\n",
+ "7 3888 5304 5647 4159 3943 1110 873\n",
+ "8 3138 4594 5242 3616 3648 1372 1233\n",
+ "9 2211 2962 3846 2654 2732 1764 1770\n",
+ "10 1953 2900 3844 2370 2599 2086 2113\n",
+ "11 1929 2949 3889 2516 2816 2315 2360\n",
+ "12 1945 2819 3988 2657 2978 2560 2478\n",
+ "13 2294 3556 4469 3301 3535 2685 2763\n",
+ "14 3117 4489 5438 4083 4087 3042 2934\n",
+ "15 3818 6042 7071 5182 5354 4457 3400\n",
+ "16 4962 7521 8213 6149 6259 5410 3489\n",
+ "17 5574 8297 9151 6951 6790 5558 3154\n",
+ "18 4725 7089 8334 6637 7258 6165 2795\n",
+ "19 4386 6459 7794 5929 6247 5529 2579\n",
+ "20 3573 6310 7783 6345 5165 4792 2276\n",
+ "21 3079 5993 6921 6585 6265 5811 2310\n",
+ "22 1976 3614 4845 5370 6708 6493 1639\n",
+ "23 1091 1948 2571 2909 5393 5719 1018"
+ ]
+ },
+ "execution_count": 53,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "by_cross = data.groupby('Hour Weekday'.split()).apply(count).unstack()\n",
+ "by_cross"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 55,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 55,
+ "metadata": {},
+ "output_type": "execute_result"
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "import seaborn\n",
+ "seaborn.heatmap(by_cross)\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 57,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "<div>\n",
+ "\n",
+ "<table border=\"1\" class=\"dataframe\">\n",
+ "  <thead>\n",
+ "    <tr style=\"text-align: right;\">\n",
+ "      <th></th>\n",
+ "      <th>Div</th>\n",
+ "      <th>Date</th>\n",
+ "      <th>HomeTeam</th>\n",
+ "      <th>AwayTeam</th>\n",
+ "      <th>FTHG</th>\n",
+ "      <th>FTAG</th>\n",
+ "      <th>FTR</th>\n",
+ "      <th>HTHG</th>\n",
+ "      <th>HTAG</th>\n",
+ "      <th>HTR</th>\n",
+ "      <th>...</th>\n",
+ "      <th>BbAv&lt;2.5</th>\n",
+ "      <th>BbAH</th>\n",
+ "      <th>BbAHh</th>\n",
+ "      <th>BbMxAHH</th>\n",
+ "      <th>BbAvAHH</th>\n",
+ "      <th>BbMxAHA</th>\n",
+ "      <th>BbAvAHA</th>\n",
+ "      <th>PSCH</th>\n",
+ "      <th>PSCD</th>\n",
+ "      <th>PSCA</th>\n",
+ "    </tr>\n",
+ "  </thead>\n",
+ "  <tbody>\n",
+ "    <tr>\n",
+ "      <th>0</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>17/08/2018</td>\n",
+ "      <td>Betis</td>\n",
+ "      <td>Levante</td>\n",
+ "      <td>0</td>\n",
+ "      <td>3</td>\n",
+ "      <td>A</td>\n",
+ "      <td>0</td>\n",
+ "      <td>1</td>\n",
+ "      <td>A</td>\n",
+ "      <td>...</td>\n",
+ "      <td>2.06</td>\n",
+ "      <td>20</td>\n",
+ "      <td>-0.75</td>\n",
+ "      <td>1.89</td>\n",
+ "      <td>1.85</td>\n",
+ "      <td>2.07</td>\n",
+ "      <td>2.00</td>\n",
+ "      <td>1.59</td>\n",
+ "      <td>4.42</td>\n",
+ "      <td>5.89</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>1</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>17/08/2018</td>\n",
+ "      <td>Girona</td>\n",
+ "      <td>Valladolid</td>\n",
+ "      <td>0</td>\n",
+ "      <td>0</td>\n",
+ "      <td>D</td>\n",
+ "      <td>0</td>\n",
+ "      <td>0</td>\n",
+ "      <td>D</td>\n",
+ "      <td>...</td>\n",
+ "      <td>1.71</td>\n",
+ "      <td>20</td>\n",
+ "      <td>-0.75</td>\n",
+ "      <td>2.06</td>\n",
+ "      <td>2.01</td>\n",
+ "      <td>1.90</td>\n",
+ "      <td>1.85</td>\n",
+ "      <td>1.76</td>\n",
+ "      <td>3.57</td>\n",
+ "      <td>5.62</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>2</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>18/08/2018</td>\n",
+ "      <td>Barcelona</td>\n",
+ "      <td>Alaves</td>\n",
+ "      <td>3</td>\n",
+ "      <td>0</td>\n",
+ "      <td>H</td>\n",
+ "      <td>0</td>\n",
+ "      <td>0</td>\n",
+ "      <td>D</td>\n",
+ "      <td>...</td>\n",
+ "      <td>3.18</td>\n",
+ "      <td>19</td>\n",
+ "      <td>-2.50</td>\n",
+ "      <td>1.95</td>\n",
+ "      <td>1.91</td>\n",
+ "      <td>2.00</td>\n",
+ "      <td>1.95</td>\n",
+ "      <td>1.10</td>\n",
+ "      <td>11.85</td>\n",
+ "      <td>32.17</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>3</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>18/08/2018</td>\n",
+ "      <td>Celta</td>\n",
+ "      <td>Espanol</td>\n",
+ "      <td>1</td>\n",
+ "      <td>1</td>\n",
+ "      <td>D</td>\n",
+ "      <td>0</td>\n",
+ "      <td>1</td>\n",
+ "      <td>A</td>\n",
+ "      <td>...</td>\n",
+ "      <td>1.76</td>\n",
+ "      <td>18</td>\n",
+ "      <td>-0.75</td>\n",
+ "      <td>2.26</td>\n",
+ "      <td>2.18</td>\n",
+ "      <td>1.74</td>\n",
+ "      <td>1.71</td>\n",
+ "      <td>2.18</td>\n",
+ "      <td>3.26</td>\n",
+ "      <td>3.85</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>4</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>18/08/2018</td>\n",
+ "      <td>Villarreal</td>\n",
+ "      <td>Sociedad</td>\n",
+ "      <td>1</td>\n",
+ "      <td>2</td>\n",
+ "      <td>A</td>\n",
+ "      <td>1</td>\n",
+ "      <td>1</td>\n",
+ "      <td>D</td>\n",
+ "      <td>...</td>\n",
+ "      <td>1.81</td>\n",
+ "      <td>18</td>\n",
+ "      <td>-0.25</td>\n",
+ "      <td>1.76</td>\n",
+ "      <td>1.74</td>\n",
+ "      <td>2.23</td>\n",
+ "      <td>2.14</td>\n",
+ "      <td>2.32</td>\n",
+ "      <td>3.21</td>\n",
+ "      <td>3.53</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>...</th>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "      <td>...</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>375</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>18/05/2019</td>\n",
+ "      <td>Levante</td>\n",
+ "      <td>Ath Madrid</td>\n",
+ "      <td>2</td>\n",
+ "      <td>2</td>\n",
+ "      <td>D</td>\n",
+ "      <td>2</td>\n",
+ "      <td>0</td>\n",
+ "      <td>H</td>\n",
+ "      <td>...</td>\n",
+ "      <td>2.23</td>\n",
+ "      <td>18</td>\n",
+ "      <td>0.50</td>\n",
+ "      <td>1.91</td>\n",
+ "      <td>1.87</td>\n",
+ "      <td>2.04</td>\n",
+ "      <td>1.99</td>\n",
+ "      <td>4.34</td>\n",
+ "      <td>4.10</td>\n",
+ "      <td>1.81</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>376</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>18/05/2019</td>\n",
+ "      <td>Sevilla</td>\n",
+ "      <td>Ath Bilbao</td>\n",
+ "      <td>2</td>\n",
+ "      <td>0</td>\n",
+ "      <td>H</td>\n",
+ "      <td>1</td>\n",
+ "      <td>0</td>\n",
+ "      <td>H</td>\n",
+ "      <td>...</td>\n",
+ "      <td>2.08</td>\n",
+ "      <td>19</td>\n",
+ "      <td>-1.00</td>\n",
+ "      <td>2.70</td>\n",
+ "      <td>2.60</td>\n",
+ "      <td>1.60</td>\n",
+ "      <td>1.53</td>\n",
+ "      <td>2.17</td>\n",
+ "      <td>3.08</td>\n",
+ "      <td>4.15</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>377</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>18/05/2019</td>\n",
+ "      <td>Valladolid</td>\n",
+ "      <td>Valencia</td>\n",
+ "      <td>0</td>\n",
+ "      <td>2</td>\n",
+ "      <td>A</td>\n",
+ "      <td>0</td>\n",
+ "      <td>1</td>\n",
+ "      <td>A</td>\n",
+ "      <td>...</td>\n",
+ "      <td>2.25</td>\n",
+ "      <td>20</td>\n",
+ "      <td>1.50</td>\n",
+ "      <td>1.78</td>\n",
+ "      <td>1.74</td>\n",
+ "      <td>2.20</td>\n",
+ "      <td>2.13</td>\n",
+ "      <td>8.01</td>\n",
+ "      <td>5.13</td>\n",
+ "      <td>1.40</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>378</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>19/05/2019</td>\n",
+ "      <td>Eibar</td>\n",
+ "      <td>Barcelona</td>\n",
+ "      <td>2</td>\n",
+ "      <td>2</td>\n",
+ "      <td>D</td>\n",
+ "      <td>2</td>\n",
+ "      <td>2</td>\n",
+ "      <td>D</td>\n",
+ "      <td>...</td>\n",
+ "      <td>2.65</td>\n",
+ "      <td>19</td>\n",
+ "      <td>0.50</td>\n",
+ "      <td>2.03</td>\n",
+ "      <td>1.98</td>\n",
+ "      <td>1.92</td>\n",
+ "      <td>1.88</td>\n",
+ "      <td>4.96</td>\n",
+ "      <td>4.55</td>\n",
+ "      <td>1.65</td>\n",
+ "    </tr>\n",
+ "    <tr>\n",
+ "      <th>379</th>\n",
+ "      <td>SP1</td>\n",
+ "      <td>19/05/2019</td>\n",
+ "      <td>Real Madrid</td>\n",
+ "      <td>Betis</td>\n",
+ "      <td>0</td>\n",
+ "      <td>2</td>\n",
+ "      <td>A</td>\n",
+ "      <td>0</td>\n",
+ "      <td>0</td>\n",
+ "      <td>D</td>\n",
+ "      <td>...</td>\n",
+ "      <td>3.42</td>\n",
+ "      <td>23</td>\n",
+ "      <td>-1.00</td>\n",
+ "      <td>1.94</td>\n",
+ "      <td>1.91</td>\n",
+ "      <td>2.01</td>\n",
+ "      <td>1.98</td>\n",
+ "      <td>1.33</td>\n",
+ "      <td>6.38</td>\n",
+ "      <td>8.09</td>\n",
+ "    </tr>\n",
+ "  </tbody>\n",
+ "</table>\n",
+ "<p>380 rows × 61 columns</p>\n",
+ "</div>"
+ ],
+ "text/plain": [
+ " Div Date HomeTeam AwayTeam FTHG FTAG FTR HTHG HTAG HTR \\\n",
+ "0 SP1 17/08/2018 Betis Levante 0 3 A 0 1 A \n",
+ "1 SP1 17/08/2018 Girona Valladolid 0 0 D 0 0 D \n",
+ "2 SP1 18/08/2018 Barcelona Alaves 3 0 H 0 0 D \n",
+ "3 SP1 18/08/2018 Celta Espanol 1 1 D 0 1 A \n",
+ "4 SP1 18/08/2018 Villarreal Sociedad 1 2 A 1 1 D \n",
+ ".. ... ... ... ... ... ... .. ... ... .. \n",
+ "375 SP1 18/05/2019 Levante Ath Madrid 2 2 D 2 0 H \n",
+ "376 SP1 18/05/2019 Sevilla Ath Bilbao 2 0 H 1 0 H \n",
+ "377 SP1 18/05/2019 Valladolid Valencia 0 2 A 0 1 A \n",
+ "378 SP1 19/05/2019 Eibar Barcelona 2 2 D 2 2 D \n",
+ "379 SP1 19/05/2019 Real Madrid Betis 0 2 A 0 0 D \n",
+ "\n",
+ " ... BbAv<2.5 BbAH BbAHh BbMxAHH BbAvAHH BbMxAHA BbAvAHA PSCH \\\n",
+ "0 ... 2.06 20 -0.75 1.89 1.85 2.07 2.00 1.59 \n",
+ "1 ... 1.71 20 -0.75 2.06 2.01 1.90 1.85 1.76 \n",
+ "2 ... 3.18 19 -2.50 1.95 1.91 2.00 1.95 1.10 \n",
+ "3 ... 1.76 18 -0.75 2.26 2.18 1.74 1.71 2.18 \n",
+ "4 ... 1.81 18 -0.25 1.76 1.74 2.23 2.14 2.32 \n",
+ ".. ... ... ... ... ... ... ... ... ... \n",
+ "375 ... 2.23 18 0.50 1.91 1.87 2.04 1.99 4.34 \n",
+ "376 ... 2.08 19 -1.00 2.70 2.60 1.60 1.53 2.17 \n",
+ "377 ... 2.25 20 1.50 1.78 1.74 2.20 2.13 8.01 \n",
+ "378 ... 2.65 19 0.50 2.03 1.98 1.92 1.88 4.96 \n",
+ "379 ... 3.42 23 -1.00 1.94 1.91 2.01 1.98 1.33 \n",
+ "\n",
+ " PSCD PSCA \n",
+ "0 4.42 5.89 \n",
+ "1 3.57 5.62 \n",
+ "2 11.85 32.17 \n",
+ "3 3.26 3.85 \n",
+ "4 3.21 3.53 \n",
+ ".. ... ... \n",
+ "375 4.10 1.81 \n",
+ "376 3.08 4.15 \n",
+ "377 5.13 1.40 \n",
+ "378 4.55 1.65 \n",
+ "379 6.38 8.09 \n",
+ "\n",
+ "[380 rows x 61 columns]"
+ ]
+ },
+ "execution_count": 57,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "season = pd.read_csv('season-1819_csv.csv')\n",
+ "season"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 61,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Index(['Div', 'Date', 'HomeTeam', 'AwayTeam', 'FTHG', 'FTAG', 'FTR', 'HTHG',\n",
+ " 'HTAG', 'HTR', 'HS', 'AS', 'HST', 'AST', 'HF', 'AF', 'HC', 'AC', 'HY',\n",
+ " 'AY', 'HR', 'AR', 'B365H', 'B365D', 'B365A', 'BWH', 'BWD', 'BWA', 'IWH',\n",
+ " 'IWD', 'IWA', 'PSH', 'PSD', 'PSA', 'WHH', 'WHD', 'WHA', 'VCH', 'VCD',\n",
+ " 'VCA', 'Bb1X2', 'BbMxH', 'BbAvH', 'BbMxD', 'BbAvD', 'BbMxA', 'BbAvA',\n",
+ " 'BbOU', 'BbMx>2.5', 'BbAv>2.5', 'BbMx<2.5', 'BbAv<2.5', 'BbAH', 'BbAHh',\n",
+ " 'BbMxAHH', 'BbAvAHH', 'BbMxAHA', 'BbAvAHA', 'PSCH', 'PSCD', 'PSCA'],\n",
+ " dtype='object')"
+ ]
+ },
+ "execution_count": 61,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "season.columns"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.8.3"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}