-
Notifications
You must be signed in to change notification settings - Fork 0
/
editDataSpain.py
29 lines (23 loc) · 882 Bytes
/
editDataSpain.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
import os, glob
import pandas
import re
def editDataES():
    """Load the Spanish (ES) COVID-19 long-format CSV files into one DataFrame.

    Every ``*long.csv`` file in ``../Data/Sources/ES/COVID 19/`` (relative to
    the directory of this script) whose name contains
    ``ccaa_covid19_<variable>_long`` is read, tagged with ``<variable>`` in a
    ``variable`` column, and concatenated. The variable names are then mapped
    through the ``ES`` -> ``Measure`` columns of ``variableTable_ALL.csv``,
    which is read from the script's directory; names missing from that table
    are kept as they are.

    Side effect: the process working directory is changed to the directory
    that contains this script.

    Returns:
        pandas.DataFrame: columns ``Region``, ``RegionCode``, ``Date``,
        ``value``, ``variable`` (categorical) and ``Country`` (always
        ``'ES'``). Rows follow the alphabetical order of the input files.

    Raises:
        ValueError: if no input file matching the naming convention exists.
    """
    script_dir = os.path.dirname(os.path.abspath(__file__))
    # Kept from the original: the relative paths below are resolved against
    # the script's own directory.
    os.chdir(script_dir)

    inputLoc = "../Data/Sources/ES/COVID 19/"
    name_pattern = re.compile(r"ccaa_covid19_(.*)_long")

    frames = []
    # glob returns files in filesystem order; sort so the row order of the
    # result is reproducible across machines and runs.
    for path in sorted(glob.glob(os.path.join(inputLoc, "*long.csv"))):
        match = name_pattern.search(os.path.basename(path))
        if match is None:
            # The glob is looser than the naming convention. Files that do
            # not follow it carry no variable name, so skip them instead of
            # failing with an IndexError.
            continue
        frame = pandas.read_csv(path, sep=',')
        frame['variable'] = match.group(1)
        frames.append(frame)

    if not frames:
        raise ValueError(
            "No 'ccaa_covid19_*_long' CSV files found in {}".format(
                os.path.abspath(inputLoc)
            )
        )

    # sort=True orders the columns alphabetically, which the positional
    # renaming below relies on.
    dfES = pandas.concat(frames, ignore_index=True, sort=True)

    # Load variable names: maps the ES source name to the common measure name.
    varNames = pandas.read_csv(
        'variableTable_ALL.csv', index_col="ES"
    )["Measure"].to_dict()
    dfES['variable'] = pandas.Categorical(dfES['variable']).rename_categories(varNames)

    # NOTE(review): positional rename - assumes every source file has exactly
    # four columns whose alphabetical order corresponds to region name,
    # region code, date and value. Confirm against the source data.
    dfES.columns = ['Region', 'RegionCode', 'Date', 'value', 'variable']
    dfES['Country'] = 'ES'
    return dfES
# Runs whenever this module is executed or imported: builds the ES dataset
# and keeps it in the module-level name dfES.
dfES = editDataES()