-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmultibattle_test.csv
We can make this file beautiful and searchable if this error is corrected: It looks like row 21 should actually have 5 columns, instead of 4 in line 20.
213 lines (213 loc) · 12.7 KB
/
multibattle_test.csv
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
1,-0.0202000006350378,-12.120000381022692,0.5134924542790356
2,-0.013000000584870558,-7.800000350922346,0.5829846101648789
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
1,-0.016916667393719158,-10.150000436231494,0.9131004715330494
2,-0.013583333917583026,-8.150000350549817,4.014862265765374
3,-0.024583333997676777,-14.750000398606062,0.7860787503289592
4,-0.021650000462929354,-12.990000277757645,0.4720204082339273
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
1,-0.017166667332251865,-10.30000039935112,0.6173376086401949
2,-0.024350000657141255,-14.610000394284725,1.2871421508844332
3,-0.013750000810250643,-8.250000486150384,0.6697964709757589
4,-0.027166667434697346,-16.30000046081841,0.5764425336660879
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
1,-0.019266667213911803,-11.560000328347087,0.6259022262336618
2,-0.008350000443557905,-5.010000266134739,5.042095000505374
3,-0.017416667376334467,-10.450000425800681,0.5876662034092616
4,-0.02616666728320221,-15.700000369921327,0.5297814458258618
Episode,Test Reward per step,Test Total Reward,Q Loss,Encoder Loss
1,-0.02991666739496092,-17.950000436976552,0.12877337246185389
2,-0.027666667448356747,-16.60000046901405,0.4466445219305377
3,-0.028500000769272445,-17.100000461563468,0.2864450327546942
4,-0.020583333993951482,-12.350000396370888,12.245569654966303
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.0138888894725177,-12.500000525265932,4.672263254231182
2,-0.02462222279566873,-22.160000516101718,0.2884990447433257
3,-0.020444445096784173,-18.40000058710575,1.1497078214341243
4,-0.015777778399901264,-14.200000559911132,0.8200105993516784
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.016080000463873124,-24.120000695809722,3.938892811305629
2,-0.0092666669972241,-13.900000495836139,4.786046176319218
3,-0.012926667129000022,-19.390000693500042,5.016167023518426
4,-0.018493333908418834,-27.74000086262822,4.4709069241215245
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.014233333749075715,-21.350000623613596,3.855935144177071
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.008513333849608897,-12.770000774413347,4.6186894706299295
2,-0.020480000669757543,-30.720001004636288,0.9844894802415216
3,-0.013066667165607188,-19.60000074841082,5.132481761838836
4,-0.010793333698064067,-16.190000547096133,3.303723068407857
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.012566667168090734,-18.85000075213611,3.129182820673457
2,-0.011366667189945782,-17.050000784918666,4.83307322013206
3,-0.014426667125274711,-21.640000687912107,3.493385392978833
4,-0.007606667190790181,-11.410000786185265,2.8810071629823684
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.011600000526756062,-17.400000790134072,6.510007922458228
2,-0.015400000628083955,-23.100000942125916,5.016244273394496
3,-0.01940000044430296,-29.100000666454434,6.5327909420774635
4,-0.015286667189250366,-22.930000783875585,7.301351223127974
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.017633333863069586,-26.45000079460442,4.723755816795473
2,-0.0184000005622705,-27.600000843405724,5.1472105470954475
3,-0.01749333378300067,-26.24000067450106,6.187318619888354
4,-0.014193333916366069,-21.29000087454915,4.372770968092653
5,-0.012440000462035333,-18.660000693053007,6.705587154475912
6,-0.009520000455280151,-14.280000682920218,5.044945299204622
7,-0.01256666712214551,-18.85000068321824,3.6227991832479476
8,-0.012946667216718177,-19.420000825077295,4.7343459795095075
9,-0.011953333730498944,-17.930000595748425,4.37964290151462
10,-0.01590000061442455,-23.85000092163682,5.073054181778732
11,-0.018800000625352094,-28.200000938028097,6.4217221297469695
12,-0.009353333638360089,-14.030000457540154,2.326690824345633
13,-0.01113333398352066,-16.700000975281,4.088894226917782
14,-0.01877333383386332,-28.160000750795007,6.965291854854348
15,-0.008800000560780384,-13.20000084117055,6.716618712611441
16,-0.006506667185574764,-9.760000778362155,6.338816239727024
17,-0.013146667167544347,-19.720000751316547,5.3729539678646905
18,-0.01246666702876489,-18.700000543147326,3.045792233520615
19,-0.015480000466108305,-23.220000699162483,5.825426741973972
20,-0.010546667162328955,-15.820000743493438,5.155739172888348
21,-0.014360000568131588,-21.54000085219741,5.760099837235765
22,-0.013193333954860767,-19.79000093229115,3.4039871329562956
23,-0.012493333842605342,-18.74000076390803,6.1903340154980615
24,-0.019180000388373974,-28.770000582560897,8.856001470026799
25,-0.0048400004717210855,-7.260000707581639,4.43471647486869
26,-0.005100000241150463,-7.650000361725688,2.0701213867848063
27,-0.008060000479221348,-12.090000718832016,4.49394223410806
28,-0.01813333394502604,-27.200000917539,7.214098290217735
29,-0.014833333913236869,-22.250000869855285,4.590483085388257
30,-0.015446667176981732,-23.17000076547265,4.348702317768268
31,-0.012486667290329927,-18.7300009354949,5.459759096608507
32,-0.018873333974430927,-28.310000961646438,4.654146627557933
33,-0.010673333797603846,-16.01000069640577,3.8625871425653906
34,-0.009220000413556898,-13.83000062033534,6.231194434857544
35,-0.018886667191982235,-28.330000787973404,6.47520289880112
36,-0.012920000550647577,-19.380000825971365,4.811888993683196
37,-0.01721333382402854,-25.820000736042857,7.760760664732109
38,-0.01666666724657015,-25.000000869855285,5.955171101746863
39,-0.014193333819508522,-21.29000072926283,4.544590253053912
40,-0.012466667236139381,-18.700000854209065,5.458408982768921
41,-0.013653333819160857,-20.480000728741288,4.556887937451069
42,-0.014286667271206751,-21.430000906810164,3.751098855674642
43,-0.015946667237828168,-23.920000856742263,4.177117820975304
44,-0.01056666719416777,-15.85000079125166,4.95332936082556
45,-0.012726667137195653,-19.0900007057935,5.087166722076107
46,-0.011793333644668258,-17.690000467002392,4.1788316582722915
47,-0.013713333706061075,-20.570000559091568,7.788322448991352
48,-0.014066667222728337,-21.100000834092498,3.411615719742488
49,-0.009366667111714692,-14.050000667572021,8.506367806288537
50,-0.01563333389908075,-23.45000084862113,7.114352168325883
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.005083333545053997,-15.250000635161996,4.0690177911984104
2,-0.0017800688730789588,-5.1800004206597805,5.247128358700801
3,-0.007693333643178146,-23.080000929534435,6.52815954385015
4,-0.00676666699287793,-20.30000097863376,7.152028998600009
5,-0.004670000258212284,-14.010000774636865,11.336737939413906
6,-0.007096666987364489,-21.290000962093472,5.624755771789628
7,-0.001956666850795349,-5.8700005523860455,8.644268418864495
8,-0.005133333653211591,-15.40000095963478,8.653161331177749
9,-0.008970000282550858,-26.910000847652555,4.9132782174147405
10,-0.004486666999757288,-13.46000099927187,6.408604541718168
11,-0.00283000027388334,-8.490000821650028,4.8490399657665995
12,-0.004140000335251288,-12.420001005753875,8.77624316112005
13,-0.0014633335278679911,-4.390000583603978,25.19092738425413
14,-0.003276666926220058,-9.830000778660178,5.291499710836837
15,-0.005980000387256345,-17.940001161769032,10.316609222477446
16,-0.006776667060951392,-20.330001182854176,5.231879151211019
17,-0.00870000035005311,-26.100001050159335,5.083763212642539
18,-0.007593333667765063,-22.780001003295183,5.938277710856843
19,-0.002070000216985742,-6.210000650957227,4.206157889257769
20,-0.002070000084737931,-6.21000025421381,5.155173649675296
21,-0.00014000018561879864,-0.4200005568563938,4.617884986477783
22,-0.0033266668537010676,-9.980000561103225,3.9722283499655937
23,-0.006516667064900196,-19.5500011947006,6.343596511256628
24,-0.00859333377269407,-25.780001318082213,4.519633306648428
25,-0.0057733336742967324,-17.32000102289021,8.632578533394488
26,-0.006080000325416526,-18.240000976249576,5.091030961399023
27,-0.0027733335569500965,-8.320000670850277,3.642865209649233
28,-0.01274666713053982,-38.240001391619444,5.983787242462287
29,-0.007010000328843793,-21.030000986531377,8.90549713997356
30,-0.005226666940997042,-15.680000822991133,8.857616423498653
31,-0.0011292776964009928,-2.9700003415346146,3.5895696628188043
32,-0.006033333695183196,-18.100001085549593,4.0521899498844975
33,-0.001493333617846171,-4.480000853538513,4.367968963913931
34,-0.0009100001621991408,-2.730000486597419,20.33450688049449
35,-0.006883333733926213,-20.65000120177865,4.428582752741727
36,-0.003990000224361819,-11.970000673085451,5.347212844775701
37,-0.0002900002729147668,-0.8700008187443018,11.013067101749403
38,-0.0008633335592846049,-2.5900006778538227,5.215288246104402
39,0.0025733331125229633,7.719999337568879,9.603697080070559
40,-0.00822333364002406,-24.670000920072198,12.400482628053584
41,-0.001603333519150811,-4.81000055745244,3.8035408607902372
42,-0.005620000327626864,-16.860000982880592,6.50861624105265
43,-0.009060000280539186,-27.180000841617584,6.014622391845945
44,-0.00899333356010416,-26.980000680312514,5.046779040676723
45,-0.006590000376105307,-19.770001128315926,6.143304929300761
46,-0.004900000236928461,-14.700000710785389,4.93075222342223
47,-0.008666667106250922,-26.000001318752766,10.330566445839054
48,-0.004950000385443373,-14.850001156330109,8.132347862971306
49,-0.0011300003274033474,-3.39000098221004,4.7150844008879655
50,-0.009943333777909484,-29.830001333728433,8.092762558676585
Episode,Test Reward per step,Test Total Reward,Q Loss
Episode,Test Reward per step,Test Total Reward,Q Loss
1,-0.010316667007282376,-24.760000817477703,5.389483116871746
2,-0.0068958336386519175,-16.5500007327646,5.126234294267838
3,-0.00427083378812919,-10.250001091510057,5.326486256430453
4,-0.003837500281321506,-9.210000675171614,5.3233375058803745
5,-0.007141667094547301,-17.140001026913524,5.471940371506152
6,-0.011608333700181295,-27.86000088043511,4.231081664823982
7,-0.010537500327142577,-25.290000785142183,3.65810068531941
8,-0.010550000482859711,-25.320001158863306,3.736380994256997
9,-0.01178750029609849,-28.290000710636377,7.637241010043745
10,-0.0040291670306275285,-9.67000087350607,6.313896968601068