-
Notifications
You must be signed in to change notification settings - Fork 33
/
Copy pathworld_data.py
executable file
·158 lines (131 loc) · 5.51 KB
/
world_data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
import json
import dateutil.parser
import datetime
import os.path
import time
import shared
import fetch_data
# Run fetch_data's fetch handler at import time, before the data file is read
# further down in this module.
# NOTE(review): presumably this refreshes the file at shared.FILENAME when
# needed -- confirm in fetch_data.handle_fetch.
fetch_data.handle_fetch()
def dates_to_days(XDates):
    """Convert dates to sorted day offsets relative to the earliest date.

    Args:
        XDates: Iterable of date/datetime objects that support subtraction
            yielding an object with a ``days`` attribute.

    Returns:
        A new ascending list with one integer per input date: the number of
        days between that date and the earliest date in the input. An empty
        input yields an empty list.
    """
    # Materialise once so one-shot iterables work and the input is only
    # traversed a fixed number of times.
    dates = list(XDates)
    if not dates:
        return []
    # The earliest date is loop-invariant; computing it once avoids the
    # quadratic cost of calling min() for every element.
    first = min(dates)
    return sorted((date - first).days for date in dates)
# Read the data file as text and rewrite a few country labels before parsing.
# The replacements are plain text substitutions over the whole file content,
# not just over country fields.
with open(shared.FILENAME) as f:
    s = (
        f.read()
        .replace('Iran (Islamic Republic of)', 'Iran')  # obsolete?
        .replace('Mainland China', 'China')  # obsolete ?
        .replace('Korea, South', 'South Korea')
    )
# The reported size is the length of the text after the substitutions.
print("read data: %i bytes" % len(s))
# Parsed data used by get_country_xcdr below.
d = json.loads(s)
# todo check for unknown excluded countries
def get_country_xcdr(country='all', province='all', excludeCountries=None, excludeProvinces=None,
                     dateOffset=0, returnLists=False, returnDates=False, verbose=True):
    """Sum confirmed, deaths and recovered counts per date over selected locations.

    Reads the module-level ``d``. Every entry of ``d['confirmed']['locations']``
    that passes the filters contributes its ``history``; the matching deaths and
    recovered values are looked up at the same list position and date key in
    ``d['deaths']`` and ``d['recovered']``. A missing recovered value counts as 0.

    Args:
        country: Country name to keep; ``'all'`` (or ``''``) keeps every country.
        province: Province name to keep; ``'all'`` (or ``''``) keeps every province.
        excludeCountries: Container of country names to skip; ``None`` means
            none. A message is printed for every skipped location.
        excludeProvinces: Container of province names to skip; ``None`` means
            none. A message is printed for every skipped location.
        dateOffset: Value added to every day number in the result.
        returnLists: If true, return the names found in the data instead of
            the aggregated counts (see Returns).
        returnDates: If true, the first tuple element is the parsed date
            instead of a day number.
        verbose: If true, print a short summary of the returned data.

    Returns:
        A list of ``(x, confirmed, deaths, recovered)`` tuples sorted ascending,
        containing only dates whose three sums are not all zero. ``x`` is the
        number of days since the earliest date of the selected locations plus
        ``dateOffset``, or the date itself when ``returnDates`` is true.
        If ``returnLists`` is true, returns ``(countries, provinces)`` instead:
        two sorted lists of every name in the data, regardless of the filters.

    Raises:
        Exception: If no data point remains after filtering; the available
            countries/provinces are printed first when the requested name is
            not among them.
    """
    # None replaces the former mutable list defaults; explicit lists still work.
    excludeCountries = () if excludeCountries is None else excludeCountries
    excludeProvinces = () if excludeProvinces is None else excludeProvinces
    country = '' if country == 'all' else country  # empty string is same as all
    province = '' if province == 'all' else province

    countries = set()
    provinces = set()
    totals = {}  # parsed date -> [confirmed, deaths, recovered]

    for index, location in enumerate(d['confirmed']['locations']):
        # Names are recorded before filtering so they can be listed on error
        # or returned via returnLists.
        countries.add(str(location['country']))
        provinces.add(str(location['province']))

        if country != '' and location['country'] != country:
            continue
        if location['country'] in excludeCountries:
            print("Excluded country/province:", location['country'], location['province'])
            continue
        if province != '' and location['province'] != province:
            continue
        if location['province'] in excludeProvinces:  # global provinces can't have the same name
            print("Excluded country/province:", location['country'], location['province'])
            continue

        for date_key, raw_confirmed in location['history'].items():
            confirmed = int(raw_confirmed)
            deaths = int(d['deaths']['locations'][index]['history'][date_key])
            try:
                recovered = int(d['recovered']['locations'][index]['history'][date_key])
            except (KeyError, IndexError):
                recovered = 0
            date = dateutil.parser.parse(date_key)
            if date in totals:
                sums = totals[date]
                sums[0] += confirmed
                sums[1] += deaths
                sums[2] += recovered
            else:
                totals[date] = [confirmed, deaths, recovered]

    # The earliest selected date is the day-zero reference; it is computed once
    # instead of once per date.
    firstDate = min(totals) if totals else None

    listXYYY = []
    XDatesAllNonEmpty = []
    for date, (C, D, R) in totals.items():
        if (C + D + R) > 0:
            day = (date - firstDate).days + dateOffset
            x = date if returnDates else day
            listXYYY.append((x, C, D, R))
            XDatesAllNonEmpty.append(date)
    listXYYY.sort()  # in place by first item

    if returnLists:
        return sorted(countries), sorted(provinces)

    if not listXYYY:
        # Show the available names to help spot a misspelled country/province.
        # They were already collected above, so no second pass is needed.
        if country not in countries:
            print(sorted(countries))
        if province not in provinces:
            print()
            print(sorted(provinces))
        raise Exception("get_country_xcdr empty - country '%s' or province '%s' not found?" % (country, province))

    if verbose:
        print("todays date: %s" % datetime.date.today())
        print("data points for %s: %s" % (country, len(listXYYY)))
        print("first data: %s" % min(XDatesAllNonEmpty).date())
        print("latest data: %s (you can update the data manually by running fetch_data.py)" % max(totals).date())
    return listXYYY
def get_countries_provinces():
    """Return the (countries, provinces) pair from get_country_xcdr(returnLists=True).

    TODO: make this a separate function for easier readability.
    """
    names = get_country_xcdr(returnLists=True)
    country_names, province_names = names
    return country_names, province_names
if __name__ == '__main__':
    # Demo when run as a script: two stacked plots, Italy first, then every
    # country except China.
    import numpy as np
    import matplotlib.pyplot as plt

    def _plot_xcdr(axes, rows, legend_title):
        # Plot columns 1-3 of `rows` (confirmed, deaths, recovered) against
        # column 0 on the given axes and attach a titled legend.
        table = np.array(rows)
        days = table[:, 0]
        #axes.set_yscale("log", nonposy='clip')
        series = (
            (1, 'b', 2, 'confirmed'),
            (2, 'y', 2, 'deaths'),
            (3, 'r--', 1, 'recovered'),
        )
        for column, fmt, width, label in series:
            axes.plot(days, table[:, column], fmt, alpha=0.5, lw=width, label=label)
        axes.legend(title=legend_title)

    fig = plt.figure(figsize=(10, 10), dpi=200)

    # First subplot: a single country.
    ax = fig.add_subplot(211)
    COUNTRY = 'Italy'
    PROVINCE = 'all'
    _plot_xcdr(ax, get_country_xcdr(COUNTRY, PROVINCE),
               'COVID-19 data (beta): ' + COUNTRY + " " + PROVINCE)

    # Second subplot: all countries with China excluded.
    ax2 = fig.add_subplot(212)
    COUNTRY = 'all'
    excludeCountries = ['China']
    PROVINCE = 'all'
    _plot_xcdr(ax2, get_country_xcdr(COUNTRY, PROVINCE, excludeCountries=excludeCountries),
               'COVID-19 data (beta): all but China')

    plt.show()
    #plt.savefig('data.png')