-
-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathcovid19_prepare_data.py
66 lines (45 loc) · 1.81 KB
/
covid19_prepare_data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# coding: utf-8
# In[1]:
import requests
from datetime import datetime
import pandas as pd
# In[2]:
def build_country_data(country):
    """Flatten one country's historical timeline into per-date records.

    Args:
        country: Mapping with a ``'country'`` name, an optional
            ``'province'`` and a ``'timeline'`` mapping whose ``'cases'``,
            ``'deaths'`` and ``'recovered'`` entries each map a date key to
            a value.

    Returns:
        A list with one dict per date key found in ``timeline['cases']``,
        in the order those keys appear. Each dict holds ``'Report_Date'``
        plus ``'<name>_cases'``, ``'<name>_deaths'`` and
        ``'<name>_recovered'``, where ``<name>`` is the country name,
        suffixed with ``'_<province>'`` when a province is given. A value
        is ``None`` when the matching series has no entry for that date.
        An absent timeline or ``'cases'`` series yields an empty list.
    """
    # A missing (or null) series is treated as empty instead of raising
    # AttributeError on a chained ``.get``.
    timeline = country.get('timeline') or {}
    cases = timeline.get('cases') or {}
    deaths = timeline.get('deaths') or {}
    recovered = timeline.get('recovered') or {}

    # The column prefix does not depend on the date, so build it once.
    country_name = country.get('country')
    province = country.get('province')
    if province is not None:
        country_name = country_name + '_' + province

    return [
        {
            'Report_Date': key,
            country_name + '_cases': cases.get(key),
            country_name + '_deaths': deaths.get(key),
            country_name + '_recovered': recovered.get(key),
        }
        for key in cases
    ]
# In[5]:
def build_covid19_data():
    """Download the historical COVID-19 data and save it as wide CSV files.

    Each entry of the JSON response is flattened with
    ``build_country_data`` into a date-indexed frame of cases, deaths and
    recovered columns. The frames are joined side by side, keeping only
    the dates present in every frame (inner join on the date index).

    Side effects:
        Writes ``data/covid19_data.csv`` (the full table) and
        ``data/covid19_data_backtesting.csv`` (the same table without its
        last five rows), creating the ``data`` directory if needed.

    Returns:
        The combined ``pandas.DataFrame``, indexed by ``Report_Date``.

    Raises:
        requests.HTTPError: If the service answers with an error status.
        ValueError: If the response contains no usable timeline data.
    """
    import os  # function-scope import keeps this block self-contained

    request_str = 'https://corona.lmao.ninja/v2/historical?lastdays=all'
    # Without a timeout a stalled connection would block forever.
    response = requests.get(request_str, timeout=30)
    # Fail with the HTTP error itself rather than iterating over None.
    response.raise_for_status()
    json_data = response.json()

    frames = []
    for country in json_data:
        records = build_country_data(country)
        if not records:
            # An entry without dates has no 'Report_Date' column to index.
            continue
        frame = pd.DataFrame(records)
        frame.index = pd.DatetimeIndex(frame['Report_Date'])
        # Keyword form: the positional ``axis`` argument of ``drop`` is
        # not accepted by current pandas releases.
        frame = frame.drop(columns='Report_Date').sort_index()
        frames.append(frame)

    if not frames:
        raise ValueError('No COVID-19 timeline data returned by ' + request_str)

    # One inner join over all frames instead of merging pairwise in a
    # loop, which recopies the growing table on every iteration.
    # NOTE(review): assumes each country/province prefix is unique in the
    # response; duplicated column names would be kept as-is here.
    df = pd.concat(frames, axis=1, join='inner')
    df.index.name = 'Report_Date'

    os.makedirs('data', exist_ok=True)
    df.to_csv('data/covid19_data.csv')
    # Hold back the five most recent rows for backtesting.
    df_backtesting = df.iloc[:-5]
    df_backtesting.to_csv('data/covid19_data_backtesting.csv')
    return df
# In[6]:
# df = build_covid19_data()