-
Notifications
You must be signed in to change notification settings - Fork 0
/
trial_details.txt
269 lines (237 loc) · 5.26 KB
/
trial_details.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
Trial 1 Parameters:
-------------------------
lr: 0.0060547536754836685
hidden_size: 80
num_layers: 2
sync_rate: 9
a_start: 0.7546054852624321
b_start: 0.6014487599094669
a_end: 0.22361955510181494
b_end: 0.015434136218467252
a_last_episode: 1992
b_last_episode: 1029
sigma: 0.7565081545269917
Max Reward: -0.22287461161613464
Trial 2 Parameters:
-------------------------
lr: 0.0021741337096116337
hidden_size: 413
num_layers: 2
sync_rate: 6
a_start: 0.6801494613705947
b_start: 0.6231213528463587
a_end: 0.13412713824928874
b_end: 0.15800063786150717
a_last_episode: 767
b_last_episode: 1679
sigma: 0.9439189469085211
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.005415830704708877
hidden_size: 369
num_layers: 2
sync_rate: 6
a_start: 0.6007267671775257
b_start: 0.8984131488544513
a_end: 0.2534446089062141
b_end: 0.05425089562501308
a_last_episode: 1185
b_last_episode: 1383
sigma: 0.9966979790809836
Max Reward: -0.27519628405570984
Trial 2 Parameters:
-------------------------
lr: 0.006756331889267519
hidden_size: 112
num_layers: 4
sync_rate: 4
a_start: 0.7983209400471342
b_start: 0.6510435650505203
a_end: 0.26782001247604637
b_end: 0.15883086439391836
a_last_episode: 606
b_last_episode: 1254
sigma: 0.8362227130290028
Max Reward: -1.1987535953521729
Trial 3 Parameters:
-------------------------
lr: 0.0054373009253962535
hidden_size: 160
num_layers: 3
sync_rate: 3
a_start: 0.9938722141813819
b_start: 0.6873888124517772
a_end: 0.17885439147430005
b_end: 0.03596797575114374
a_last_episode: 550
b_last_episode: 546
sigma: 0.932908913083222
Max Reward: -0.4606098532676697
Trial 4 Parameters:
-------------------------
lr: 0.0016844012859661562
hidden_size: 88
num_layers: 1
sync_rate: 1
a_start: 0.6732657331186468
b_start: 0.6495077404268287
a_end: 0.18895875587765215
b_end: 0.12141266588918598
a_last_episode: 1947
b_last_episode: 717
sigma: 0.6513775735522214
Max Reward: -0.30024203658103943
Trial 5 Parameters:
-------------------------
lr: 0.0034633918580646993
hidden_size: 501
num_layers: 4
sync_rate: 3
a_start: 0.8461141029081797
b_start: 0.6560030542177767
a_end: 0.12546293922245225
b_end: 0.05137430286307736
a_last_episode: 1024
b_last_episode: 1810
sigma: 0.37824813003979574
Max Reward: -1.0082851648330688
Trial 6 Parameters:
-------------------------
lr: 0.0018771685890684752
hidden_size: 173
num_layers: 4
sync_rate: 7
a_start: 0.8469652918162813
b_start: 0.7317471863855722
a_end: 0.11076798444940009
b_end: 0.03462904710420782
a_last_episode: 1595
b_last_episode: 1482
sigma: 0.19951006630182577
Max Reward: -1.2910088300704956
Trial 7 Parameters:
-------------------------
lr: 0.003417794864858785
hidden_size: 70
num_layers: 3
sync_rate: 10
a_start: 0.8085311980949843
b_start: 0.6425260705200779
a_end: 0.2693462561623857
b_end: 0.17748913395169344
a_last_episode: 1689
b_last_episode: 787
sigma: 0.31265445919632223
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.00805470822926657
hidden_size: 495
num_layers: 1
sync_rate: 2
a_start: 0.6412880437984753
b_start: 0.9260038141702474
a_end: 0.132446282181354
b_end: 0.10877554124999125
a_last_episode: 621
b_last_episode: 1872
sigma: 0.3967210190900776
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.007809621329621953
hidden_size: 377
num_layers: 2
sync_rate: 6
a_start: 0.7584854398994391
b_start: 0.7370714593925317
a_end: 0.10725587794017298
b_end: 0.1856894138376594
a_last_episode: 1298
b_last_episode: 778
sigma: 0.8880989183131195
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.005365365508976488
hidden_size: 233
num_layers: 1
sync_rate: 5
a_start: 0.9762036578532075
b_start: 0.7443912675552409
a_end: 0.14902997006604904
b_end: 0.018446614683500673
a_last_episode: 1926
b_last_episode: 1200
sigma: 0.5277136721216977
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.001158316697378192
hidden_size: 479
num_layers: 1
sync_rate: 7
a_start: 0.9013665291054777
b_start: 0.7231103369393888
a_end: 0.13606871962101647
b_end: 0.07116233226621796
a_last_episode: 1665
b_last_episode: 1954
sigma: 0.6674885077904684
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.007959881081803498
hidden_size: 224
num_layers: 2
sync_rate: 2
a_start: 0.8143017294524554
b_start: 0.6665479248219891
a_end: 0.20906936940777995
b_end: 0.02798460648176243
a_last_episode: 924
b_last_episode: 559
sigma: 0.5132546131846938
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.006570707509928243
hidden_size: 77
num_layers: 1
sync_rate: 7
a_start: 0.781908459037425
b_start: 0.6336991216861404
a_end: 0.268077752415272
b_end: 0.11642230086654967
a_last_episode: 1250
b_last_episode: 626
sigma: 0.1711142759528855
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.00040401115090463717
hidden_size: 471
num_layers: 4
sync_rate: 10
a_start: 0.8822656715213817
b_start: 0.641420843855454
a_end: 0.29810154388569254
b_end: 0.018523403499779177
a_last_episode: 1258
b_last_episode: 849
sigma: 0.6167071020732507
Max Reward: -9999
Trial 1 Parameters:
-------------------------
lr: 0.004982617212386112
hidden_size: 374
num_layers: 2
sync_rate: 6
a_start: 0.9247143738665486
b_start: 0.6179189571216942
a_end: 0.16509594545677678
b_end: 0.13656838747974184
a_last_episode: 1818
b_last_episode: 1521
sigma: 0.944895801271307