-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathcombineDataset.py
126 lines (109 loc) · 3.87 KB
/
combineDataset.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
# Build the combined training file by concatenating the hand-labelled tweet
# file with the per-city CSV exports.
#
# Labelled-tweet lines are copied through unchanged.  City rows are
# ';'-separated with exactly three fields; the first field is ignored, the
# second is the tweet text and the third is a label.  Each city row becomes
#     <tweet text>::::::<class>\n
# where <class> is "1" for the label "crash" and "0" for "fire", "shooting"
# and "NO".

from contextlib import ExitStack

OUTPUT_PATH = "finalDataset.txt"
LABELLED_TWEETS_PATH = "labeledTweetDataset.txt"
CITY_CSV_PATHS = (
    "Boston4C.csv",
    "Chicago4C.csv",
    "Memphis4C.csv",
    "NYC4C.csv",
    "SanFrancisco4Classes.csv",
    "Seattle4Classes.csv",
)

FIELD_SEPARATOR = ";"
RECORD_SEPARATOR = "::::::"

# City label -> binary class written to the combined file.
CLASS_BY_LABEL = {
    "fire": "0",
    "shooting": "0",
    "NO": "0",
    "crash": "1",
}


def _convert_city_row(raw_line):
    """Convert one city CSV row into an output record.

    Args:
        raw_line: One line of a city file, with or without its trailing
            newline.

    Returns:
        The string ``"<tweet text>::::::<class>\\n"``, or ``None`` when the
        row does not split into exactly three ';'-separated fields or when
        its label is not a key of ``CLASS_BY_LABEL``.  An unknown label is
        also reported on stdout.
    """
    fields = raw_line.split(FIELD_SEPARATOR)
    if len(fields) != 3:
        # Rows with a different field count are dropped without a message.
        return None

    label = fields[2].strip("\n")
    binary_class = CLASS_BY_LABEL.get(label)
    if binary_class is None:
        print("error")
        print(label + "XX")
        # Skip the row: writing it would emit a record with no class and no
        # line terminator, which would run into the following record.
        return None

    return fields[1] + RECORD_SEPARATOR + binary_class + "\n"


def combine_datasets(labelled_path=LABELLED_TWEETS_PATH,
                     city_paths=CITY_CSV_PATHS,
                     output_path=OUTPUT_PATH):
    """Write the labelled tweets followed by every converted city row.

    After each input file has been processed, a running counter is printed.
    The counter starts at 1, so each printed value is one more than the
    number of records written so far.

    Args:
        labelled_path: File whose lines are copied to the output as-is.
        city_paths: Iterable of ';'-separated city files, processed in order.
        output_path: File to create or overwrite with the combined records.

    Returns:
        The number of records written to ``output_path``.

    Raises:
        OSError: If any input cannot be opened or the output cannot be
            created.
    """
    written = 0
    with ExitStack() as stack:
        # Open every input before touching the output, so a missing input
        # does not truncate an existing output file.
        labelled_file = stack.enter_context(open(labelled_path, "r"))
        city_files = [
            stack.enter_context(open(path, "r")) for path in city_paths
        ]
        output_file = stack.enter_context(open(output_path, "w"))

        for line in labelled_file:
            # Only the last line can lack a newline; terminate it so the
            # first city record does not get appended to it.
            if not line.endswith("\n"):
                line += "\n"
            output_file.write(line)
            written += 1
        print(written + 1)

        for city_file in city_files:
            for raw_line in city_file:
                record = _convert_city_row(raw_line)
                if record is not None:
                    output_file.write(record)
                    written += 1
            print(written + 1)

    return written


def main():
    """Combine the default input files into ``finalDataset.txt``."""
    combine_datasets()


if __name__ == "__main__":
    main()