bjarlestam commited on
Commit
c601067
·
1 Parent(s): db4f938

6.5 million steps

Browse files
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a643cbf7b2ac8d5478e93ccde9824c7b6fc525a66c00d6034f86fc3542f487a6
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:938451bcaff44acbe51f407c436b7194c2536f33414a46d8c63a8ec4ebef6e4c
3
  size 2815689
SoccerTwos/{SoccerTwos-1999296.onnx → SoccerTwos-6555492.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac47805af8d5542ee031595400e2556ed067c74675337a54764fdd6820a44bc7
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:938451bcaff44acbe51f407c436b7194c2536f33414a46d8c63a8ec4ebef6e4c
3
  size 2815689
SoccerTwos/{SoccerTwos-1999296.pt → SoccerTwos-6555492.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7c86154f343e186e65f0e9b4a79f1f7f17a41fa98d0cb9a878f05650adcdf03
3
  size 34728689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b24686f444a9a2ee6005e0fd0ff7cd1e4f3675c1c6be7372b906f496a971669
3
  size 34728689
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0603acde269a37bfb4e99f923fb838c0ea5533012c6a4a336945182df7c1331b
3
  size 34728689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b24686f444a9a2ee6005e0fd0ff7cd1e4f3675c1c6be7372b906f496a971669
3
  size 34728689
SoccerTwos/events.out.tfevents.1683487711.CLM-FVFF611QQ05P.local.92718.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27550dbaccbad0cf343c9ddfc637656823ec6bdd24d93662738cef04f49c4a1c
3
+ size 381197
run_logs/Player-0.log CHANGED
@@ -10,7 +10,7 @@ NullGfxDevice:
10
  Renderer: Null Device
11
  Vendor: Unity Technologies
12
  Begin MonoManager ReloadAssembly
13
- - Completed reload, in 0.094 seconds
14
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -35,17 +35,16 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
- UnloadTime: 0.641916 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
- GRPC Exception: Status(StatusCode=Unknown, Detail="Exception calling application: [Errno 32] Broken pipe"). Disconnecting from trainer.
42
- Thread 0x17144f000 may have been prematurely finalized
43
  Setting up 4 worker threads for Enlighten.
44
  Memory Statistics:
45
  [ALLOC_TEMP_TLS] TLS Allocator
46
  StackAllocators :
47
  [ALLOC_TEMP_MAIN]
48
- Peak usage frame count: [8.0 KB-16.0 KB]: 14298 frames, [2.0 MB-4.0 MB]: 1 frames
49
  Initial Block Size 4.0 MB
50
  Current Block Size 4.0 MB
51
  Peak Allocated Bytes 2.1 MB
@@ -73,7 +72,7 @@ Memory Statistics:
73
  [ALLOC_TEMP_Job.Worker 0]
74
  Initial Block Size 256.0 KB
75
  Current Block Size 256.0 KB
76
- Peak Allocated Bytes 0 B
77
  Overflow Count 0
78
  [ALLOC_TEMP_Background Job.Worker 10]
79
  Initial Block Size 32.0 KB
@@ -196,22 +195,22 @@ Memory Statistics:
196
  Peak Allocated Bytes 0 B
197
  Overflow Count 0
198
  [ALLOC_DEFAULT] Dual Thread Allocator
199
- Peak main deferred allocation count 3
200
  [ALLOC_BUCKET]
201
  Large Block size 4.0 MB
202
  Used Block count 1
203
  Peak Allocated bytes 1.0 MB
204
  [ALLOC_DEFAULT_MAIN]
205
- Peak usage frame count: [4.0 MB-8.0 MB]: 14299 frames
206
  Requested Block Size 16.0 MB
207
  Peak Block count 1
208
- Peak Allocated memory 4.8 MB
209
  Peak Large allocation bytes 0 B
210
  [ALLOC_DEFAULT_THREAD]
211
- Peak usage frame count: [16.0 MB-32.0 MB]: 14299 frames
212
  Requested Block Size 16.0 MB
213
  Peak Block count 1
214
- Peak Allocated memory 17.5 MB
215
  Peak Large allocation bytes 16.0 MB
216
  [ALLOC_TEMP_JOB_1_FRAME]
217
  Initial Block Size 2.0 MB
@@ -240,13 +239,13 @@ Memory Statistics:
240
  Used Block count 1
241
  Peak Allocated bytes 1.0 MB
242
  [ALLOC_GFX_MAIN]
243
- Peak usage frame count: [32.0 KB-64.0 KB]: 14298 frames, [64.0 KB-128.0 KB]: 1 frames
244
  Requested Block Size 16.0 MB
245
  Peak Block count 1
246
  Peak Allocated memory 65.6 KB
247
  Peak Large allocation bytes 0 B
248
  [ALLOC_GFX_THREAD]
249
- Peak usage frame count: [128.0 KB-256.0 KB]: 14299 frames
250
  Requested Block Size 16.0 MB
251
  Peak Block count 1
252
  Peak Allocated memory 173.5 KB
@@ -258,13 +257,13 @@ Memory Statistics:
258
  Used Block count 1
259
  Peak Allocated bytes 1.0 MB
260
  [ALLOC_CACHEOBJECTS_MAIN]
261
- Peak usage frame count: [0.5 MB-1.0 MB]: 14299 frames
262
  Requested Block Size 4.0 MB
263
  Peak Block count 1
264
  Peak Allocated memory 0.6 MB
265
  Peak Large allocation bytes 0 B
266
  [ALLOC_CACHEOBJECTS_THREAD]
267
- Peak usage frame count: [0.5 MB-1.0 MB]: 14298 frames, [2.0 MB-4.0 MB]: 1 frames
268
  Requested Block Size 4.0 MB
269
  Peak Block count 1
270
  Peak Allocated memory 3.4 MB
@@ -276,13 +275,13 @@ Memory Statistics:
276
  Used Block count 1
277
  Peak Allocated bytes 1.0 MB
278
  [ALLOC_TYPETREE_MAIN]
279
- Peak usage frame count: [0-1.0 KB]: 14299 frames
280
  Requested Block Size 2.0 MB
281
  Peak Block count 1
282
  Peak Allocated memory 1.0 KB
283
  Peak Large allocation bytes 0 B
284
  [ALLOC_TYPETREE_THREAD]
285
- Peak usage frame count: [1.0 KB-2.0 KB]: 14298 frames, [2.0 KB-4.0 KB]: 1 frames
286
  Requested Block Size 2.0 MB
287
  Peak Block count 1
288
  Peak Allocated memory 2.2 KB
 
10
  Renderer: Null Device
11
  Vendor: Unity Technologies
12
  Begin MonoManager ReloadAssembly
13
+ - Completed reload, in 0.097 seconds
14
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
15
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
35
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
36
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
37
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
38
+ UnloadTime: 1.679917 ms
39
  Registered Communicator in Agent.
40
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
41
+ Thread 0x16e6df000 may have been prematurely finalized
 
42
  Setting up 4 worker threads for Enlighten.
43
  Memory Statistics:
44
  [ALLOC_TEMP_TLS] TLS Allocator
45
  StackAllocators :
46
  [ALLOC_TEMP_MAIN]
47
+ Peak usage frame count: [8.0 KB-16.0 KB]: 6919 frames, [2.0 MB-4.0 MB]: 1 frames
48
  Initial Block Size 4.0 MB
49
  Current Block Size 4.0 MB
50
  Peak Allocated Bytes 2.1 MB
 
72
  [ALLOC_TEMP_Job.Worker 0]
73
  Initial Block Size 256.0 KB
74
  Current Block Size 256.0 KB
75
+ Peak Allocated Bytes 0.7 KB
76
  Overflow Count 0
77
  [ALLOC_TEMP_Background Job.Worker 10]
78
  Initial Block Size 32.0 KB
 
195
  Peak Allocated Bytes 0 B
196
  Overflow Count 0
197
  [ALLOC_DEFAULT] Dual Thread Allocator
198
+ Peak main deferred allocation count 2
199
  [ALLOC_BUCKET]
200
  Large Block size 4.0 MB
201
  Used Block count 1
202
  Peak Allocated bytes 1.0 MB
203
  [ALLOC_DEFAULT_MAIN]
204
+ Peak usage frame count: [4.0 MB-8.0 MB]: 6920 frames
205
  Requested Block Size 16.0 MB
206
  Peak Block count 1
207
+ Peak Allocated memory 5.0 MB
208
  Peak Large allocation bytes 0 B
209
  [ALLOC_DEFAULT_THREAD]
210
+ Peak usage frame count: [16.0 MB-32.0 MB]: 6920 frames
211
  Requested Block Size 16.0 MB
212
  Peak Block count 1
213
+ Peak Allocated memory 17.4 MB
214
  Peak Large allocation bytes 16.0 MB
215
  [ALLOC_TEMP_JOB_1_FRAME]
216
  Initial Block Size 2.0 MB
 
239
  Used Block count 1
240
  Peak Allocated bytes 1.0 MB
241
  [ALLOC_GFX_MAIN]
242
+ Peak usage frame count: [32.0 KB-64.0 KB]: 6919 frames, [64.0 KB-128.0 KB]: 1 frames
243
  Requested Block Size 16.0 MB
244
  Peak Block count 1
245
  Peak Allocated memory 65.6 KB
246
  Peak Large allocation bytes 0 B
247
  [ALLOC_GFX_THREAD]
248
+ Peak usage frame count: [128.0 KB-256.0 KB]: 6920 frames
249
  Requested Block Size 16.0 MB
250
  Peak Block count 1
251
  Peak Allocated memory 173.5 KB
 
257
  Used Block count 1
258
  Peak Allocated bytes 1.0 MB
259
  [ALLOC_CACHEOBJECTS_MAIN]
260
+ Peak usage frame count: [0.5 MB-1.0 MB]: 6920 frames
261
  Requested Block Size 4.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 0.6 MB
264
  Peak Large allocation bytes 0 B
265
  [ALLOC_CACHEOBJECTS_THREAD]
266
+ Peak usage frame count: [0.5 MB-1.0 MB]: 6919 frames, [2.0 MB-4.0 MB]: 1 frames
267
  Requested Block Size 4.0 MB
268
  Peak Block count 1
269
  Peak Allocated memory 3.4 MB
 
275
  Used Block count 1
276
  Peak Allocated bytes 1.0 MB
277
  [ALLOC_TYPETREE_MAIN]
278
+ Peak usage frame count: [0-1.0 KB]: 6920 frames
279
  Requested Block Size 2.0 MB
280
  Peak Block count 1
281
  Peak Allocated memory 1.0 KB
282
  Peak Large allocation bytes 0 B
283
  [ALLOC_TYPETREE_THREAD]
284
+ Peak usage frame count: [1.0 KB-2.0 KB]: 6919 frames, [2.0 KB-4.0 KB]: 1 frames
285
  Requested Block Size 2.0 MB
286
  Peak Block count 1
287
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,201 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 2.479091167449951,
6
- "min": 2.4658448696136475,
7
- "max": 2.58561635017395,
8
- "count": 76
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 49899.1484375,
12
- "min": 8394.09375,
13
- "max": 59788.078125,
14
- "count": 76
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 55.18681318681319,
18
- "min": 35.1875,
19
- "max": 83.23728813559322,
20
- "count": 76
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 20088.0,
24
- "min": 2252.0,
25
- "max": 20324.0,
26
- "count": 76
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1649.8954830393834,
30
- "min": 1594.3697009364087,
31
- "max": 1650.8506175397752,
32
- "count": 76
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 300280.9779131678,
36
- "min": 51997.66731364747,
37
- "max": 331919.8479288847,
38
- "count": 76
39
  },
40
  "SoccerTwos.Step.mean": {
41
- "value": 6179996.0,
42
- "min": 5429978.0,
43
- "max": 6179996.0,
44
- "count": 76
45
  },
46
  "SoccerTwos.Step.sum": {
47
- "value": 6179996.0,
48
- "min": 5429978.0,
49
- "max": 6179996.0,
50
- "count": 76
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
- "value": 0.07872677594423294,
54
- "min": -0.08215012401342392,
55
- "max": 0.08388468623161316,
56
- "count": 76
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
- "value": 14.249547004699707,
60
- "min": -12.486818313598633,
61
- "max": 14.249547004699707,
62
- "count": 76
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
- "value": 0.07752089947462082,
66
- "min": -0.08446293324232101,
67
- "max": 0.08493209630250931,
68
- "count": 76
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
- "value": 14.031283378601074,
72
- "min": -12.83836555480957,
73
- "max": 14.031283378601074,
74
- "count": 76
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
- "count": 76
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
- "count": 76
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
- "value": 0.18952817383392082,
90
- "min": -0.30000479135684627,
91
- "max": 0.28260000117800455,
92
- "count": 76
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
- "value": 34.30459946393967,
96
- "min": -50.10080015659332,
97
- "max": 49.737600207328796,
98
- "count": 76
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
- "value": 0.18952817383392082,
102
- "min": -0.30000479135684627,
103
- "max": 0.28260000117800455,
104
- "count": 76
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
- "value": 34.30459946393967,
108
- "min": -50.10080015659332,
109
- "max": 49.737600207328796,
110
- "count": 76
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
- "count": 76
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
- "count": 76
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.015399371163221076,
126
- "min": 0.011844274809118361,
127
- "max": 0.024232410235951345,
128
- "count": 36
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.015399371163221076,
132
- "min": 0.011844274809118361,
133
- "max": 0.024232410235951345,
134
- "count": 36
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.06767735456426939,
138
- "min": 0.055261904994646706,
139
- "max": 0.06967596064011256,
140
- "count": 36
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.06767735456426939,
144
- "min": 0.055261904994646706,
145
- "max": 0.06967596064011256,
146
- "count": 36
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.0684792855133613,
150
- "min": 0.05549707127114137,
151
- "max": 0.0708642177283764,
152
- "count": 36
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.0684792855133613,
156
- "min": 0.05549707127114137,
157
- "max": 0.0708642177283764,
158
- "count": 36
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.00025000000000000006,
162
  "min": 0.00025000000000000006,
163
  "max": 0.00025000000000000006,
164
- "count": 36
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.00025000000000000006,
168
  "min": 0.00025000000000000006,
169
  "max": 0.00025000000000000006,
170
- "count": 36
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.25,
174
  "min": 0.25,
175
  "max": 0.25,
176
- "count": 36
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.25,
180
  "min": 0.25,
181
  "max": 0.25,
182
- "count": 36
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.010000000000000002,
186
  "min": 0.010000000000000002,
187
  "max": 0.010000000000000002,
188
- "count": 36
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.010000000000000002,
192
  "min": 0.010000000000000002,
193
  "max": 0.010000000000000002,
194
- "count": 36
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1683484175",
200
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:38:11) \n[Clang 14.0.6 ]",
201
  "command_line_arguments": "/Users/andreas.bjarlestam/mambaforge/envs/huggingface-rl-course/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
@@ -204,103 +204,103 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1683487657"
208
  },
209
- "total": 3481.642826833,
210
  "count": 1,
211
- "self": 0.266701749999811,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.03880720800000015,
215
  "count": 1,
216
- "self": 0.03880720800000015
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 3481.3373178750003,
220
  "count": 1,
221
- "self": 0.7055969289958739,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 1.8457452910002883,
225
- "count": 5,
226
- "self": 1.8457452910002883
227
  },
228
  "TrainerController.advance": {
229
- "total": 3478.6461231130047,
230
- "count": 52567,
231
- "self": 0.5951379080393053,
232
  "children": {
233
  "env_step": {
234
- "total": 2799.831084738981,
235
- "count": 52567,
236
- "self": 2701.921003805895,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 97.46038615304738,
240
- "count": 52567,
241
- "self": 2.8379347090271096,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 94.62245144402027,
245
- "count": 95322,
246
- "self": 94.62245144402027
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 0.4496947800386013,
252
- "count": 52566,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 3478.3395808320347,
257
- "count": 52566,
258
  "is_parallel": true,
259
- "self": 853.5667974280468,
260
  "children": {
261
  "steps_from_proto": {
262
- "total": 0.00852233499997479,
263
- "count": 10,
264
  "is_parallel": true,
265
- "self": 0.0010013339999064286,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
- "total": 0.007521001000068361,
269
- "count": 40,
270
  "is_parallel": true,
271
- "self": 0.007521001000068361
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
- "total": 2624.7642610689877,
277
- "count": 52566,
278
  "is_parallel": true,
279
- "self": 7.129942069017943,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
- "total": 47.107922168025965,
283
- "count": 52566,
284
  "is_parallel": true,
285
- "self": 47.107922168025965
286
  },
287
  "communicator.exchange": {
288
- "total": 2473.9557799219765,
289
- "count": 52566,
290
  "is_parallel": true,
291
- "self": 2473.9557799219765
292
  },
293
  "steps_from_proto": {
294
- "total": 96.57061690996699,
295
- "count": 105132,
296
  "is_parallel": true,
297
- "self": 10.97493528192777,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
- "total": 85.59568162803922,
301
- "count": 420528,
302
  "is_parallel": true,
303
- "self": 85.59568162803922
304
  }
305
  }
306
  }
@@ -313,31 +313,24 @@
313
  }
314
  },
315
  "trainer_advance": {
316
- "total": 678.2199004659842,
317
- "count": 52566,
318
- "self": 4.748937736947255,
319
  "children": {
320
  "process_trajectory": {
321
- "total": 134.27234868403667,
322
- "count": 52566,
323
- "self": 134.07668543403662,
324
- "children": {
325
- "RLTrainer._checkpoint": {
326
- "total": 0.19566325000005236,
327
- "count": 1,
328
- "self": 0.19566325000005236
329
- }
330
- }
331
  },
332
  "_update_policy": {
333
- "total": 539.1986140450002,
334
- "count": 36,
335
- "self": 65.58856171399077,
336
  "children": {
337
  "TorchPOCAOptimizer.update": {
338
- "total": 473.61005233100946,
339
- "count": 1080,
340
- "self": 473.61005233100946
341
  }
342
  }
343
  }
@@ -346,19 +339,19 @@
346
  }
347
  },
348
  "trainer_threads": {
349
- "total": 4.5899969336460344e-07,
350
  "count": 1,
351
- "self": 4.5899969336460344e-07
352
  },
353
  "TrainerController._save_models": {
354
- "total": 0.13985208299982332,
355
  "count": 1,
356
- "self": 0.003031791000012163,
357
  "children": {
358
  "RLTrainer._checkpoint": {
359
- "total": 0.13682029199981116,
360
  "count": 1,
361
- "self": 0.13682029199981116
362
  }
363
  }
364
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 2.503404140472412,
6
+ "min": 2.4523873329162598,
7
+ "max": 2.5370821952819824,
8
+ "count": 37
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 47905.140625,
12
+ "min": 16055.9697265625,
13
+ "max": 55159.47265625,
14
+ "count": 37
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 64.93333333333334,
18
+ "min": 49.91752577319588,
19
+ "max": 76.84375,
20
+ "count": 37
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19480.0,
24
+ "min": 4772.0,
25
+ "max": 20184.0,
26
+ "count": 37
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1652.4748588887048,
30
+ "min": 1642.8951631352754,
31
+ "max": 1669.7917318437467,
32
+ "count": 37
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 247871.2288333057,
36
+ "min": 76077.51671093542,
37
+ "max": 321056.13316160464,
38
+ "count": 37
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 6549982.0,
42
+ "min": 6189948.0,
43
+ "max": 6549982.0,
44
+ "count": 37
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 6549982.0,
48
+ "min": 6189948.0,
49
+ "max": 6549982.0,
50
+ "count": 37
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": 0.051142871379852295,
54
+ "min": -0.06000871956348419,
55
+ "max": 0.0756918340921402,
56
+ "count": 37
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": 7.671430587768555,
60
+ "min": -9.386945724487305,
61
+ "max": 12.262077331542969,
62
+ "count": 37
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": 0.05099420249462128,
66
+ "min": -0.05922776460647583,
67
+ "max": 0.07353535294532776,
68
+ "count": 37
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": 7.649130344390869,
72
+ "min": -9.559730529785156,
73
+ "max": 11.912727355957031,
74
+ "count": 37
75
  },
76
  "SoccerTwos.Environment.CumulativeReward.mean": {
77
  "value": 0.0,
78
  "min": 0.0,
79
  "max": 0.0,
80
+ "count": 37
81
  },
82
  "SoccerTwos.Environment.CumulativeReward.sum": {
83
  "value": 0.0,
84
  "min": 0.0,
85
  "max": 0.0,
86
+ "count": 37
87
  },
88
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
89
+ "value": 0.07690666834513346,
90
+ "min": -0.2579976199638276,
91
+ "max": 0.22876027267273158,
92
+ "count": 37
93
  },
94
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
95
+ "value": 11.53600025177002,
96
+ "min": -43.343600153923035,
97
+ "max": 35.7960000038147,
98
+ "count": 37
99
  },
100
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
101
+ "value": 0.07690666834513346,
102
+ "min": -0.2579976199638276,
103
+ "max": 0.22876027267273158,
104
+ "count": 37
105
  },
106
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
107
+ "value": 11.53600025177002,
108
+ "min": -43.343600153923035,
109
+ "max": 35.7960000038147,
110
+ "count": 37
111
  },
112
  "SoccerTwos.IsTraining.mean": {
113
  "value": 1.0,
114
  "min": 1.0,
115
  "max": 1.0,
116
+ "count": 37
117
  },
118
  "SoccerTwos.IsTraining.sum": {
119
  "value": 1.0,
120
  "min": 1.0,
121
  "max": 1.0,
122
+ "count": 37
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
+ "value": 0.013742929190630093,
126
+ "min": 0.013162332853729216,
127
+ "max": 0.021872061599666873,
128
+ "count": 17
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
+ "value": 0.013742929190630093,
132
+ "min": 0.013162332853729216,
133
+ "max": 0.021872061599666873,
134
+ "count": 17
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
+ "value": 0.060539432987570765,
138
+ "min": 0.05456341157356898,
139
+ "max": 0.06828681615491708,
140
+ "count": 17
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
+ "value": 0.060539432987570765,
144
+ "min": 0.05456341157356898,
145
+ "max": 0.06828681615491708,
146
+ "count": 17
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
+ "value": 0.06114285662770271,
150
+ "min": 0.05531582894424598,
151
+ "max": 0.0692600845048825,
152
+ "count": 17
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
+ "value": 0.06114285662770271,
156
+ "min": 0.05531582894424598,
157
+ "max": 0.0692600845048825,
158
+ "count": 17
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
  "value": 0.00025000000000000006,
162
  "min": 0.00025000000000000006,
163
  "max": 0.00025000000000000006,
164
+ "count": 17
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
  "value": 0.00025000000000000006,
168
  "min": 0.00025000000000000006,
169
  "max": 0.00025000000000000006,
170
+ "count": 17
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
  "value": 0.25,
174
  "min": 0.25,
175
  "max": 0.25,
176
+ "count": 17
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
  "value": 0.25,
180
  "min": 0.25,
181
  "max": 0.25,
182
+ "count": 17
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
  "value": 0.010000000000000002,
186
  "min": 0.010000000000000002,
187
  "max": 0.010000000000000002,
188
+ "count": 17
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
  "value": 0.010000000000000002,
192
  "min": 0.010000000000000002,
193
  "max": 0.010000000000000002,
194
+ "count": 17
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
+ "start_time_seconds": "1683487709",
200
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:38:11) \n[Clang 14.0.6 ]",
201
  "command_line_arguments": "/Users/andreas.bjarlestam/mambaforge/envs/huggingface-rl-course/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.app --run-id=SoccerTwos --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
 
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0",
206
  "numpy_version": "1.21.2",
207
+ "end_time_seconds": "1683489353"
208
  },
209
+ "total": 1643.169040458,
210
  "count": 1,
211
+ "self": 0.11722787500002596,
212
  "children": {
213
  "run_training.setup": {
214
+ "total": 0.013663792000000008,
215
  "count": 1,
216
+ "self": 0.013663792000000008
217
  },
218
  "TrainerController.start_learning": {
219
+ "total": 1643.038148791,
220
  "count": 1,
221
+ "self": 0.31101058200579246,
222
  "children": {
223
  "TrainerController._reset_env": {
224
+ "total": 2.2248240839999744,
225
+ "count": 3,
226
+ "self": 2.2248240839999744
227
  },
228
  "TrainerController.advance": {
229
+ "total": 1640.320858083994,
230
+ "count": 25389,
231
+ "self": 0.2661743909673078,
232
  "children": {
233
  "env_step": {
234
+ "total": 1330.830156340017,
235
+ "count": 25389,
236
+ "self": 1284.3852757490256,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
+ "total": 46.23812745699054,
240
+ "count": 25389,
241
+ "self": 1.2487462569900671,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
+ "total": 44.98938120000047,
245
+ "count": 46132,
246
+ "self": 44.98938120000047
247
  }
248
  }
249
  },
250
  "workers": {
251
+ "total": 0.20675313400085837,
252
+ "count": 25388,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
+ "total": 1640.2869981199963,
257
+ "count": 25388,
258
  "is_parallel": true,
259
+ "self": 393.89563319499894,
260
  "children": {
261
  "steps_from_proto": {
262
+ "total": 0.005132874999992598,
263
+ "count": 6,
264
  "is_parallel": true,
265
+ "self": 0.0006161679999161507,
266
  "children": {
267
  "_process_rank_one_or_two_observation": {
268
+ "total": 0.0045167070000764475,
269
+ "count": 24,
270
  "is_parallel": true,
271
+ "self": 0.0045167070000764475
272
  }
273
  }
274
  },
275
  "UnityEnvironment.step": {
276
+ "total": 1246.3862320499973,
277
+ "count": 25388,
278
  "is_parallel": true,
279
+ "self": 3.1823133230072926,
280
  "children": {
281
  "UnityEnvironment._generate_step_input": {
282
+ "total": 22.304695663003482,
283
+ "count": 25388,
284
  "is_parallel": true,
285
+ "self": 22.304695663003482
286
  },
287
  "communicator.exchange": {
288
+ "total": 1175.0904308869885,
289
+ "count": 25388,
290
  "is_parallel": true,
291
+ "self": 1175.0904308869885
292
  },
293
  "steps_from_proto": {
294
+ "total": 45.808792176997834,
295
+ "count": 50776,
296
  "is_parallel": true,
297
+ "self": 5.091343413956125,
298
  "children": {
299
  "_process_rank_one_or_two_observation": {
300
+ "total": 40.71744876304171,
301
+ "count": 203104,
302
  "is_parallel": true,
303
+ "self": 40.71744876304171
304
  }
305
  }
306
  }
 
313
  }
314
  },
315
  "trainer_advance": {
316
+ "total": 309.2245273530094,
317
+ "count": 25388,
318
+ "self": 2.159055672025943,
319
  "children": {
320
  "process_trajectory": {
321
+ "total": 68.22423439098337,
322
+ "count": 25388,
323
+ "self": 68.22423439098337
 
 
 
 
 
 
 
324
  },
325
  "_update_policy": {
326
+ "total": 238.8412372900001,
327
+ "count": 17,
328
+ "self": 29.788104290999627,
329
  "children": {
330
  "TorchPOCAOptimizer.update": {
331
+ "total": 209.05313299900047,
332
+ "count": 510,
333
+ "self": 209.05313299900047
334
  }
335
  }
336
  }
 
339
  }
340
  },
341
  "trainer_threads": {
342
+ "total": 4.1600014810683206e-07,
343
  "count": 1,
344
+ "self": 4.1600014810683206e-07
345
  },
346
  "TrainerController._save_models": {
347
+ "total": 0.18145562500012602,
348
  "count": 1,
349
+ "self": 0.0011100420001639577,
350
  "children": {
351
  "RLTrainer._checkpoint": {
352
+ "total": 0.18034558299996206,
353
  "count": 1,
354
+ "self": 0.18034558299996206
355
  }
356
  }
357
  }
run_logs/training_status.json CHANGED
@@ -1,16 +1,7 @@
1
  {
2
  "SoccerTwos": {
3
- "elo": 1653.8590589333792,
4
  "checkpoints": [
5
- {
6
- "steps": 1999296,
7
- "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-1999296.onnx",
8
- "reward": 0.0,
9
- "creation_time": 1683415133.0676868,
10
- "auxillary_file_paths": [
11
- "results/SoccerTwos/SoccerTwos/SoccerTwos-1999296.pt"
12
- ]
13
- },
14
  {
15
  "steps": 3999978,
16
  "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-3999978.onnx",
@@ -46,15 +37,24 @@
46
  "auxillary_file_paths": [
47
  "results/SoccerTwos/SoccerTwos/SoccerTwos-6187920.pt"
48
  ]
 
 
 
 
 
 
 
 
 
49
  }
50
  ],
51
  "final_checkpoint": {
52
- "steps": 6187920,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
  "reward": 0.0,
55
- "creation_time": 1683487656.9546309,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos/SoccerTwos/SoccerTwos-6187920.pt"
58
  ]
59
  }
60
  },
 
1
  {
2
  "SoccerTwos": {
3
+ "elo": 1655.486498013031,
4
  "checkpoints": [
 
 
 
 
 
 
 
 
 
5
  {
6
  "steps": 3999978,
7
  "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-3999978.onnx",
 
37
  "auxillary_file_paths": [
38
  "results/SoccerTwos/SoccerTwos/SoccerTwos-6187920.pt"
39
  ]
40
+ },
41
+ {
42
+ "steps": 6555492,
43
+ "file_path": "results/SoccerTwos/SoccerTwos/SoccerTwos-6555492.onnx",
44
+ "reward": 0.0,
45
+ "creation_time": 1683489352.9770849,
46
+ "auxillary_file_paths": [
47
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-6555492.pt"
48
+ ]
49
  }
50
  ],
51
  "final_checkpoint": {
52
+ "steps": 6555492,
53
  "file_path": "results/SoccerTwos/SoccerTwos.onnx",
54
  "reward": 0.0,
55
+ "creation_time": 1683489352.9770849,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos/SoccerTwos/SoccerTwos-6555492.pt"
58
  ]
59
  }
60
  },