-
Notifications
You must be signed in to change notification settings - Fork 0
/
q2_dagger_ant.csv
We can make this file beautiful and searchable if this error is corrected: No commas found in this CSV file in line 0.
170 lines (170 loc) · 4.58 KB
/
q2_dagger_ant.csv
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
train_ep_lens_Average: 1000.0
train_ep_lens_Std: 0.0
train_ep_lens_Median: 1000.0
train_ep_lens_Min: 1000
train_ep_lens_Max: 1000
eval_ep_lens_Average: 1000.0
eval_ep_lens_Std: 0.0
eval_ep_lens_Median: 1000.0
eval_ep_lens_Min: 1000
eval_ep_lens_Max: 1000
train_returns_Average: 4713.6533
train_returns_Std: 12.196533
train_returns_Median: 4713.6533
train_returns_Min: 4701.4565
train_returns_Max: 4725.8496
eval_returns_Average: 2669.5461
eval_returns_Std: 1798.3542
eval_returns_Median: 2669.5461
eval_returns_Min: 871.19196
eval_returns_Max: 4467.9004
Train_EnvstepsSoFar: 0
TimeSinceStart: 5.798490524291992
Training Loss: 0.0016225475
reward_Average: 4.713653
reward_Std: 1.0507793
reward_Median: 4.807543
reward_Min: -1.6958617
reward_Max: 7.336165
eval_reward_Average: 2.6695461
eval_reward_Std: 1.912805
eval_reward_Median: 1.3043379
eval_reward_Min: -1.5003492
eval_reward_Max: 6.852286
Initial_DataCollection_AverageReturn: 4713.6533
train_ep_lens_Average: 1000.0
train_ep_lens_Std: 0.0
train_ep_lens_Median: 1000.0
train_ep_lens_Min: 1000
train_ep_lens_Max: 1000
eval_ep_lens_Average: 1000.0
eval_ep_lens_Std: 0.0
eval_ep_lens_Median: 1000.0
eval_ep_lens_Min: 1000
eval_ep_lens_Max: 1000
train_returns_Average: 4274.328
train_returns_Std: 0.0
train_returns_Median: 4274.328
train_returns_Min: 4274.328
train_returns_Max: 4274.328
eval_returns_Average: 4860.4736
eval_returns_Std: 16.900146
eval_returns_Median: 4860.4736
eval_returns_Min: 4843.573
eval_returns_Max: 4877.3735
Train_EnvstepsSoFar: 1000
TimeSinceStart: 10.007219552993774
Training Loss: 0.0010460976
reward_Average: 4.274328
reward_Std: 0.8239454
reward_Median: 4.2998734
reward_Min: -1.5688443
reward_Max: 6.6594625
eval_reward_Average: 4.8604736
eval_reward_Std: 0.9300238
eval_reward_Median: 4.920723
eval_reward_Min: -1.2025744
eval_reward_Max: 7.205182
Initial_DataCollection_AverageReturn: 4713.6533
train_ep_lens_Average: 1000.0
train_ep_lens_Std: 0.0
train_ep_lens_Median: 1000.0
train_ep_lens_Min: 1000
train_ep_lens_Max: 1000
eval_ep_lens_Average: 1000.0
eval_ep_lens_Std: 0.0
eval_ep_lens_Median: 1000.0
eval_ep_lens_Min: 1000
eval_ep_lens_Max: 1000
train_returns_Average: 4865.9326
train_returns_Std: 0.0
train_returns_Median: 4865.9326
train_returns_Min: 4865.9326
train_returns_Max: 4865.9326
eval_returns_Average: 4854.068
eval_returns_Std: 154.9253
eval_returns_Median: 4854.068
eval_returns_Min: 4699.1426
eval_returns_Max: 5008.993
Train_EnvstepsSoFar: 2000
TimeSinceStart: 14.347546815872192
Training Loss: 0.0005845155
reward_Average: 4.8659325
reward_Std: 0.9096779
reward_Median: 4.927509
reward_Min: -1.2004149
reward_Max: 7.2841744
eval_reward_Average: 4.854068
eval_reward_Std: 0.99549216
eval_reward_Median: 4.9275723
eval_reward_Min: -1.3141468
eval_reward_Max: 7.313232
Initial_DataCollection_AverageReturn: 4713.6533
train_ep_lens_Average: 1000.0
train_ep_lens_Std: 0.0
train_ep_lens_Median: 1000.0
train_ep_lens_Min: 1000
train_ep_lens_Max: 1000
eval_ep_lens_Average: 1000.0
eval_ep_lens_Std: 0.0
eval_ep_lens_Median: 1000.0
eval_ep_lens_Min: 1000
eval_ep_lens_Max: 1000
train_returns_Average: 4588.949
train_returns_Std: 0.0
train_returns_Median: 4588.949
train_returns_Min: 4588.949
train_returns_Max: 4588.949
eval_returns_Average: 4623.982
eval_returns_Std: 118.92041
eval_returns_Median: 4623.982
eval_returns_Min: 4505.0615
eval_returns_Max: 4742.9023
Train_EnvstepsSoFar: 3000
TimeSinceStart: 18.68288516998291
Training Loss: 0.00080293807
reward_Average: 4.588949
reward_Std: 1.0410414
reward_Median: 4.6973133
reward_Min: -1.2978941
reward_Max: 7.020527
eval_reward_Average: 4.623982
eval_reward_Std: 0.9830901
eval_reward_Median: 4.6673098
eval_reward_Min: -0.9474206
eval_reward_Max: 7.558122
Initial_DataCollection_AverageReturn: 4713.6533
train_ep_lens_Average: 1000.0
train_ep_lens_Std: 0.0
train_ep_lens_Median: 1000.0
train_ep_lens_Min: 1000
train_ep_lens_Max: 1000
eval_ep_lens_Average: 1000.0
eval_ep_lens_Std: 0.0
eval_ep_lens_Median: 1000.0
eval_ep_lens_Min: 1000
eval_ep_lens_Max: 1000
train_returns_Average: 4638.1636
train_returns_Std: 0.0
train_returns_Median: 4638.1636
train_returns_Min: 4638.1636
train_returns_Max: 4638.1636
eval_returns_Average: 4715.9062
eval_returns_Std: 75.51245
eval_returns_Median: 4715.9062
eval_returns_Min: 4640.394
eval_returns_Max: 4791.419
Train_EnvstepsSoFar: 4000
TimeSinceStart: 22.875478506088257
Training Loss: 0.000618203
reward_Average: 4.6381636
reward_Std: 0.9515305
reward_Median: 4.698634
reward_Min: -1.0876839
reward_Max: 7.161714
eval_reward_Average: 4.715906
eval_reward_Std: 1.1260725
eval_reward_Median: 4.894759
eval_reward_Min: -1.2903768
eval_reward_Max: 7.5141764
Initial_DataCollection_AverageReturn: 4713.6533