-
Notifications
You must be signed in to change notification settings - Fork 0
/
create_dataset.py
134 lines (130 loc) · 3.03 KB
/
create_dataset.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
import pandas as pd
# Define the data dictionary with reviews and corresponding sentiments
data = {
'review': [
"this movie is so good! i love it",
"worst film , i hate it the most",
"pakka 1000cr, super hit! amazing",
"this movie is so good! i love it!",
"loved it will watch again",
"not bad , just okay!",
"average, one time watch",
"one man show",
"jabardasth",
"great movie",
"i hate that movie worst of all time",
"good movie, can be done better",
"had an amazing time there",
"i personally didnt like it!",
"dont go with family",
"Can watch 1 time",
# Additional positive reviews
"absolutely fantastic!",
"enjoyed every moment",
"brilliant performance by the cast",
"a masterpiece",
"loved the storyline",
"wonderful cinematography",
"superb direction",
"a must-watch",
"amazing experience",
"truly a great movie",
"fantastic, would watch again",
"loved it, highly recommend",
"excellent film",
"just perfect!",
"best movie of the year",
"it was a great watch",
"stellar performances",
"great soundtrack",
"captivating and thrilling",
"an extraordinary film",
# Additional negative reviews
"terrible movie, complete waste of time",
"horrible film, do not recommend",
"the worst movie I have ever seen",
"awful, just awful",
"boring and predictable",
"not worth watching",
"disappointing from start to finish",
"poor acting and storyline",
"too slow and dull",
"uninteresting and long",
"bad script and execution",
"overhyped and underwhelming",
"not entertaining at all",
"painfully bad",
"wish I hadn't watched it",
"felt like a chore to watch",
"badly made movie",
"nothing good about it",
"would not watch again",
"avoid at all costs"
],
'sentiment': [
1,
0,
1,
1,
1,
0,
0,
1,
1,
1,
0,
1,
1,
0,
0,
0,
# Sentiments for additional positive reviews
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
1,
# Sentiments for additional negative reviews
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0,
0
]
}
# Create a DataFrame from the data dictionary
data_frame = pd.DataFrame(data)
# Save the DataFrame to a CSV file
data_frame.to_csv('movie_reviews.csv', index=False)
# Print a success message
print("Data created successfully!")