@@ -54,16 +54,14 @@ def check_date_format(date_string):
54
54
55
55
return (new_date )
56
56
57
- def get_revised_data (base_url ):
58
- headers = {
59
- 'User-Agent' : 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/126.0.0.0 Safari/537.36'
60
- }
61
-
57
def get_dashboard_update_date(base_url, headers):
    """Fetch the dashboard's update timestamp and return it as a date string.

    Requests ``base_url + DASHBOARD_UPDATE_DATE_FILE`` with the given headers
    and parses the response body using the format "%m/%d/%Y %H:%M:%S".

    Args:
        base_url: URL prefix to which the update-date file name is appended.
        headers: HTTP headers passed through to ``requests.get``.

    Returns:
        The update date formatted as "%Y-%m-%d".

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        ValueError: If the response body is not in the expected format.
    """
    # Get update date
    update_date_url = base_url + DASHBOARD_UPDATE_DATE_FILE
    update_date_url_response = requests.get(update_date_url, headers=headers)

    # Surface HTTP failures directly instead of handing an error page to
    # strptime, which would fail with a misleading format error.
    update_date_url_response.raise_for_status()

    # strptime rejects any unconverted trailing characters, so remove
    # surrounding whitespace (e.g. a final newline) before parsing.
    raw_timestamp = update_date_url_response.text.strip()
    update_date = datetime.strptime(raw_timestamp, "%m/%d/%Y %H:%M:%S")
    return update_date.strftime("%Y-%m-%d")
66
63
64
+ def get_revised_data (base_url ,headers ,update_date ):
67
65
# Get update data
68
66
url = base_url + DASHBOARD_DATA_FILE
69
67
@@ -80,7 +78,7 @@ def get_revised_data(base_url):
80
78
df ['geo_type' ] = [create_geo_types (g ,"province" ) for g in df ['geo_value' ]]
81
79
df .insert (1 ,"issue" ,update_date )
82
80
83
- df = df .drop (["weekorder" ,"region" ,"year" ,"week" ],axis = 1 )
81
+ # df=df.drop(["weekorder","region","year","week"],axis=1)
84
82
85
83
df = df .pivot (index = ['epiweek' ,'time_value' ,'issue' ,'geo_type' ,'geo_value' ],
86
84
columns = "virus" ,values = ['tests' ,'percentpositive' ,'positivetests' ])
@@ -96,16 +94,7 @@ def get_revised_data(base_url):
96
94
97
95
return (df )
98
96
99
- def get_weekly_data (base_url ,start_year ):
100
- headers = {
101
- 'User-Agent' : 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/126.0.0.0 Safari/537.36'
102
- }
103
-
104
- # Get update date
105
- update_date_url = base_url + "RVD_UpdateDate.csv"
106
- update_date_url_response = requests .get (update_date_url , headers = headers )
107
- update_date = datetime .strptime (update_date_url_response .text ,"%m/%d/%Y %H:%M:%S" ).strftime ("%Y-%m-%d" )
108
-
97
+ def get_weekly_data (base_url ,start_year ,headers ,update_date ):
109
98
# Get current week and year
110
99
summary_url = base_url + "RVD_SummaryText.csv"
111
100
summary_url_response = requests .get (summary_url , headers = headers )
@@ -145,7 +134,7 @@ def get_weekly_data(base_url,start_year):
145
134
df_weekly ['geo_value' ] = [abbreviate_geo (g ) for g in df_weekly ['geo_value' ]]
146
135
df_weekly ['geo_type' ] = [create_geo_types (g ,"lab" ) for g in df_weekly ['geo_value' ]]
147
136
148
- if df_weekly .columns .isin (["weekorder" ,"date" ,"week" ]).all ():
149
- df_weekly = df_weekly .drop (["weekorder" ,"date" ,"week" ],axis = 1 )
137
+ # if df_weekly.columns.isin(["weekorder","date","week"]).all():
138
+ # df_weekly=df_weekly.drop(["weekorder","date","week"],axis=1)
150
139
151
140
return (df_weekly )
0 commit comments