rng0x17 committed on
Commit
68b5be9
·
1 Parent(s): 7cd0694
SoccerTwos.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:202d27e9b185d21c323ee28ace81dfb33f1c3ecaca500eb0fad56d4c8da1b1db
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:693e78241b1c621eb93840614cc30d6774aae00e0a21ee2ba50c41320a9f0cba
3
  size 2815689
SoccerTwos/SoccerTwos-27499864.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e64a090b692673693a3117b17b0489487a39ec4f7715d09cd5c0739418ea3ad
3
- size 34728689
 
 
 
 
SoccerTwos/SoccerTwos-27999982.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:1344942dab22c6e7ff69dc58293fa8e966d7c4c37384c73582c64079f205b436
3
- size 34728689
 
 
 
 
SoccerTwos/SoccerTwos-28477740.onnx DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:202d27e9b185d21c323ee28ace81dfb33f1c3ecaca500eb0fad56d4c8da1b1db
3
- size 2815689
 
 
 
 
SoccerTwos/SoccerTwos-28477740.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b45e82a0ecf22630c5a3a855bd4421054dc4baee92da623a59a52ce074e6ce4d
3
- size 34728689
 
 
 
 
SoccerTwos/{SoccerTwos-26499995.onnx → SoccerTwos-31999878.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2ce18e5f4c53b1dd5c379fa8822348c8065ccdae2769a9a4db7503ff68d522e
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2523ce43e63cbd68fc969bc3fcf28dad06cba673f5e3d6a3254c27173e051aef
3
  size 2815689
SoccerTwos/{SoccerTwos-26499995.pt → SoccerTwos-31999878.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be60d96bf0a8fcc51db2e308530bdc753106dd18bfb300db95dbdf75e1564bf0
3
- size 34728689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e826095b182fc6be7f89d0abf6955e86f652c2867540092e02203ae9e2a5860f
3
+ size 35525901
SoccerTwos/{SoccerTwos-27499864.onnx → SoccerTwos-32499928.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2d439691acfe5223f9548ef594388216f78634665d706eb087be7108a06048a5
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d1f31fb6ea15cd9042054c000696cbbcfb927df8fc33463acaac6c4c818ef2f
3
  size 2815689
SoccerTwos/{SoccerTwos-26999977.pt → SoccerTwos-32499928.pt} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ecb2c7ab1fe045868b5dbf4de308c9dcb328b9e6dc27ac09506e4d922599dd7a
3
- size 34728689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb3b5e6795c6808a6b1c5f3ff401483df0d2efca9b27d5bb191f4764fd1dfaad
3
+ size 35525901
SoccerTwos/{SoccerTwos-26999977.onnx → SoccerTwos-32999999.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78f368728b0a1e786778e6d82352a6901eb152e5ebd56cebb82f13c117cb210c
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80e9bf911d475e6a0eb9bd23f9d44ebed1e1658acf51945e75c7782ffd5268af
3
  size 2815689
SoccerTwos/SoccerTwos-32999999.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:605980ab99386002a6e8058bb25cf1dbc9afe2d9309e50d6c62f1197fb5aa7c0
3
+ size 35525901
SoccerTwos/{SoccerTwos-27999982.onnx → SoccerTwos-33499982.onnx} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c188b966c85ecccfe488de2995a282941c551e9a93648a5fd0b3bf40ccd41108
3
  size 2815689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ba39e2a4ecad130abeb21d661f822cb70b6af2369e0d51f2781c7396b73cd62
3
  size 2815689
SoccerTwos/SoccerTwos-33499982.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29b02564f86db0026ca1f1d41845e9b5cb0a491ee6d507baae7e9bc161076534
3
+ size 35525901
SoccerTwos/SoccerTwos-33646596.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:693e78241b1c621eb93840614cc30d6774aae00e0a21ee2ba50c41320a9f0cba
3
+ size 2815689
SoccerTwos/SoccerTwos-33646596.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8dd78178fede114090ae8138e9fcf2c23e1de7efed7d9567e9eee82e78b11b
3
+ size 35525901
SoccerTwos/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b45e82a0ecf22630c5a3a855bd4421054dc4baee92da623a59a52ce074e6ce4d
3
- size 34728689
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8dd78178fede114090ae8138e9fcf2c23e1de7efed7d9567e9eee82e78b11b
3
+ size 35525901
SoccerTwos/events.out.tfevents.1680172555.linux.fritz.box.18610.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e325fc91e09ae0a47bf1293cce940c6547a2690a7524ea340faa1fd9c6b08c3
3
+ size 5349667
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 204800, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 30000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 250000, "swap_steps": 10000, "window": 10, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos5", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SoccerTwos": {"trainer_type": "poca", "hyperparameters": {"batch_size": 4096, "buffer_size": 204800, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "fully_connected", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "curiosity": {"gamma": 0.9, "strength": 0.01, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0003, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 90000000, "time_horizon": 1000, "summary_freq": 10000, "threaded": false, "self_play": {"save_steps": 50000, "team_change": 250000, "swap_steps": 10000, "window": 30, "play_against_latest_model_ratio": 0.5, "initial_elo": 1200.0}, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/SoccerTwos/SoccerTwos.exe", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SoccerTwos5", "initialize_from": null, "load_model": false, "resume": true, "force": 
false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -34,10 +34,23 @@ behaviors:
34
  memory: null
35
  goal_conditioning_type: hyper
36
  deterministic: false
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  init_path: null
38
  keep_checkpoints: 5
39
  even_checkpoints: false
40
- max_steps: 30000000
41
  time_horizon: 1000
42
  summary_freq: 10000
43
  threaded: false
@@ -45,7 +58,7 @@ behaviors:
45
  save_steps: 50000
46
  team_change: 250000
47
  swap_steps: 10000
48
- window: 10
49
  play_against_latest_model_ratio: 0.5
50
  initial_elo: 1200.0
51
  behavioral_cloning: null
 
34
  memory: null
35
  goal_conditioning_type: hyper
36
  deterministic: false
37
+ curiosity:
38
+ gamma: 0.9
39
+ strength: 0.01
40
+ network_settings:
41
+ normalize: false
42
+ hidden_units: 128
43
+ num_layers: 2
44
+ vis_encode_type: simple
45
+ memory: null
46
+ goal_conditioning_type: hyper
47
+ deterministic: false
48
+ learning_rate: 0.0003
49
+ encoding_size: null
50
  init_path: null
51
  keep_checkpoints: 5
52
  even_checkpoints: false
53
+ max_steps: 90000000
54
  time_horizon: 1000
55
  summary_freq: 10000
56
  threaded: false
 
58
  save_steps: 50000
59
  team_change: 250000
60
  swap_steps: 10000
61
+ window: 30
62
  play_against_latest_model_ratio: 0.5
63
  initial_elo: 1200.0
64
  behavioral_cloning: null
run_logs/Player-0.log CHANGED
@@ -11,7 +11,7 @@ NullGfxDevice:
11
  Renderer: Null Device
12
  Vendor: Unity Technologies
13
  Begin MonoManager ReloadAssembly
14
- - Completed reload, in 0.155 seconds
15
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
17
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -36,7 +36,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
36
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
37
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
38
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
39
- UnloadTime: 0.744856 ms
40
  Registered Communicator in Agent.
41
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
42
  requesting resize 84 x 84
@@ -45,7 +45,7 @@ Memory Statistics:
45
  [ALLOC_TEMP_TLS] TLS Allocator
46
  StackAllocators :
47
  [ALLOC_TEMP_MAIN]
48
- Peak usage frame count: [8.0 KB-16.0 KB]: 183132 frames, [2.0 MB-4.0 MB]: 1 frames
49
  Initial Block Size 4.0 MB
50
  Current Block Size 4.0 MB
51
  Peak Allocated Bytes 2.1 MB
@@ -73,7 +73,7 @@ Memory Statistics:
73
  [ALLOC_TEMP_Job.Worker 0]
74
  Initial Block Size 256.0 KB
75
  Current Block Size 256.0 KB
76
- Peak Allocated Bytes 0 B
77
  Overflow Count 0
78
  [ALLOC_TEMP_Background Job.Worker 10]
79
  Initial Block Size 32.0 KB
@@ -143,7 +143,7 @@ Memory Statistics:
143
  [ALLOC_TEMP_Job.Worker 2]
144
  Initial Block Size 256.0 KB
145
  Current Block Size 256.0 KB
146
- Peak Allocated Bytes 0.7 KB
147
  Overflow Count 0
148
  [ALLOC_TEMP_Background Job.Worker 3]
149
  Initial Block Size 32.0 KB
@@ -177,16 +177,16 @@ Memory Statistics:
177
  Used Block count 1
178
  Peak Allocated bytes 1.0 MB
179
  [ALLOC_DEFAULT_MAIN]
180
- Peak usage frame count: [4.0 MB-8.0 MB]: 183133 frames
181
  Requested Block Size 16.0 MB
182
  Peak Block count 1
183
- Peak Allocated memory 4.6 MB
184
  Peak Large allocation bytes 0 B
185
  [ALLOC_DEFAULT_THREAD]
186
- Peak usage frame count: [16.0 MB-32.0 MB]: 183133 frames
187
  Requested Block Size 16.0 MB
188
  Peak Block count 1
189
- Peak Allocated memory 17.6 MB
190
  Peak Large allocation bytes 16.0 MB
191
  [ALLOC_TEMP_JOB_1_FRAME]
192
  Initial Block Size 2.0 MB
@@ -215,13 +215,13 @@ Memory Statistics:
215
  Used Block count 1
216
  Peak Allocated bytes 1.0 MB
217
  [ALLOC_GFX_MAIN]
218
- Peak usage frame count: [32.0 KB-64.0 KB]: 183132 frames, [64.0 KB-128.0 KB]: 1 frames
219
  Requested Block Size 16.0 MB
220
  Peak Block count 1
221
  Peak Allocated memory 65.6 KB
222
  Peak Large allocation bytes 0 B
223
  [ALLOC_GFX_THREAD]
224
- Peak usage frame count: [128.0 KB-256.0 KB]: 183133 frames
225
  Requested Block Size 16.0 MB
226
  Peak Block count 1
227
  Peak Allocated memory 173.5 KB
@@ -233,16 +233,16 @@ Memory Statistics:
233
  Used Block count 1
234
  Peak Allocated bytes 1.0 MB
235
  [ALLOC_CACHEOBJECTS_MAIN]
236
- Peak usage frame count: [0.5 MB-1.0 MB]: 183133 frames
237
  Requested Block Size 4.0 MB
238
  Peak Block count 1
239
  Peak Allocated memory 0.6 MB
240
  Peak Large allocation bytes 0 B
241
  [ALLOC_CACHEOBJECTS_THREAD]
242
- Peak usage frame count: [0.5 MB-1.0 MB]: 183132 frames, [4.0 MB-8.0 MB]: 1 frames
243
  Requested Block Size 4.0 MB
244
  Peak Block count 2
245
- Peak Allocated memory 4.4 MB
246
  Peak Large allocation bytes 0 B
247
  [ALLOC_TYPETREE] Dual Thread Allocator
248
  Peak main deferred allocation count 0
@@ -251,13 +251,13 @@ Memory Statistics:
251
  Used Block count 1
252
  Peak Allocated bytes 1.0 MB
253
  [ALLOC_TYPETREE_MAIN]
254
- Peak usage frame count: [0-1.0 KB]: 183133 frames
255
  Requested Block Size 2.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 1.0 KB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_TYPETREE_THREAD]
260
- Peak usage frame count: [1.0 KB-2.0 KB]: 183132 frames, [2.0 KB-4.0 KB]: 1 frames
261
  Requested Block Size 2.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 2.2 KB
 
11
  Renderer: Null Device
12
  Vendor: Unity Technologies
13
  Begin MonoManager ReloadAssembly
14
+ - Completed reload, in 0.081 seconds
15
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
17
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
36
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
37
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
38
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
39
+ UnloadTime: 0.668976 ms
40
  Registered Communicator in Agent.
41
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
42
  requesting resize 84 x 84
 
45
  [ALLOC_TEMP_TLS] TLS Allocator
46
  StackAllocators :
47
  [ALLOC_TEMP_MAIN]
48
+ Peak usage frame count: [8.0 KB-16.0 KB]: 97182 frames, [2.0 MB-4.0 MB]: 1 frames
49
  Initial Block Size 4.0 MB
50
  Current Block Size 4.0 MB
51
  Peak Allocated Bytes 2.1 MB
 
73
  [ALLOC_TEMP_Job.Worker 0]
74
  Initial Block Size 256.0 KB
75
  Current Block Size 256.0 KB
76
+ Peak Allocated Bytes 0.7 KB
77
  Overflow Count 0
78
  [ALLOC_TEMP_Background Job.Worker 10]
79
  Initial Block Size 32.0 KB
 
143
  [ALLOC_TEMP_Job.Worker 2]
144
  Initial Block Size 256.0 KB
145
  Current Block Size 256.0 KB
146
+ Peak Allocated Bytes 0 B
147
  Overflow Count 0
148
  [ALLOC_TEMP_Background Job.Worker 3]
149
  Initial Block Size 32.0 KB
 
177
  Used Block count 1
178
  Peak Allocated bytes 1.0 MB
179
  [ALLOC_DEFAULT_MAIN]
180
+ Peak usage frame count: [4.0 MB-8.0 MB]: 97183 frames
181
  Requested Block Size 16.0 MB
182
  Peak Block count 1
183
+ Peak Allocated memory 4.8 MB
184
  Peak Large allocation bytes 0 B
185
  [ALLOC_DEFAULT_THREAD]
186
+ Peak usage frame count: [16.0 MB-32.0 MB]: 97183 frames
187
  Requested Block Size 16.0 MB
188
  Peak Block count 1
189
+ Peak Allocated memory 17.4 MB
190
  Peak Large allocation bytes 16.0 MB
191
  [ALLOC_TEMP_JOB_1_FRAME]
192
  Initial Block Size 2.0 MB
 
215
  Used Block count 1
216
  Peak Allocated bytes 1.0 MB
217
  [ALLOC_GFX_MAIN]
218
+ Peak usage frame count: [32.0 KB-64.0 KB]: 97182 frames, [64.0 KB-128.0 KB]: 1 frames
219
  Requested Block Size 16.0 MB
220
  Peak Block count 1
221
  Peak Allocated memory 65.6 KB
222
  Peak Large allocation bytes 0 B
223
  [ALLOC_GFX_THREAD]
224
+ Peak usage frame count: [128.0 KB-256.0 KB]: 97183 frames
225
  Requested Block Size 16.0 MB
226
  Peak Block count 1
227
  Peak Allocated memory 173.5 KB
 
233
  Used Block count 1
234
  Peak Allocated bytes 1.0 MB
235
  [ALLOC_CACHEOBJECTS_MAIN]
236
+ Peak usage frame count: [0.5 MB-1.0 MB]: 97183 frames
237
  Requested Block Size 4.0 MB
238
  Peak Block count 1
239
  Peak Allocated memory 0.6 MB
240
  Peak Large allocation bytes 0 B
241
  [ALLOC_CACHEOBJECTS_THREAD]
242
+ Peak usage frame count: [0.5 MB-1.0 MB]: 97182 frames, [4.0 MB-8.0 MB]: 1 frames
243
  Requested Block Size 4.0 MB
244
  Peak Block count 2
245
+ Peak Allocated memory 4.5 MB
246
  Peak Large allocation bytes 0 B
247
  [ALLOC_TYPETREE] Dual Thread Allocator
248
  Peak main deferred allocation count 0
 
251
  Used Block count 1
252
  Peak Allocated bytes 1.0 MB
253
  [ALLOC_TYPETREE_MAIN]
254
+ Peak usage frame count: [0-1.0 KB]: 97183 frames
255
  Requested Block Size 2.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 1.0 KB
258
  Peak Large allocation bytes 0 B
259
  [ALLOC_TYPETREE_THREAD]
260
+ Peak usage frame count: [1.0 KB-2.0 KB]: 97182 frames, [2.0 KB-4.0 KB]: 1 frames
261
  Requested Block Size 2.0 MB
262
  Peak Block count 1
263
  Peak Allocated memory 2.2 KB
run_logs/timers.json CHANGED
@@ -2,201 +2,261 @@
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
- "value": 1.7348119020462036,
6
- "min": 1.7348119020462036,
7
- "max": 2.1338491439819336,
8
- "count": 974
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
- "value": 29144.83984375,
12
- "min": 1606.896484375,
13
- "max": 48490.890625,
14
- "count": 974
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
- "value": 55.86206896551724,
18
- "min": 22.0,
19
- "max": 85.24137931034483,
20
- "count": 974
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
- "value": 19440.0,
24
- "min": 88.0,
25
- "max": 21752.0,
26
- "count": 974
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
- "value": 1761.567949531139,
30
- "min": 1718.6108505610346,
31
- "max": 1803.8036335559661,
32
- "count": 974
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
- "value": 306512.82321841817,
36
- "min": 3474.259222005546,
37
- "max": 447654.8648728988,
38
- "count": 974
39
- },
40
- "SoccerTwos.IsTraining.mean": {
41
- "value": 1.0,
42
- "min": 1.0,
43
- "max": 1.0,
44
- "count": 974
45
- },
46
- "SoccerTwos.IsTraining.sum": {
47
- "value": 1.0,
48
- "min": 1.0,
49
- "max": 1.0,
50
- "count": 974
51
  },
52
  "SoccerTwos.Step.mean": {
53
- "value": 28469980.0,
54
- "min": 18749904.0,
55
- "max": 28469980.0,
56
- "count": 973
57
  },
58
  "SoccerTwos.Step.sum": {
59
- "value": 28469980.0,
60
- "min": 18749904.0,
61
- "max": 28469980.0,
62
- "count": 973
63
  },
64
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
65
- "value": -0.029856232926249504,
66
- "min": -0.13772714138031006,
67
- "max": 0.06465017795562744,
68
- "count": 973
69
  },
70
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
71
- "value": -5.2248406410217285,
72
- "min": -23.138160705566406,
73
- "max": 12.154233932495117,
74
- "count": 973
75
  },
76
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
77
- "value": -0.02988698147237301,
78
- "min": -0.14075849950313568,
79
- "max": 0.06273878365755081,
80
- "count": 973
81
  },
82
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
83
- "value": -5.230221748352051,
84
- "min": -23.647428512573242,
85
- "max": 11.794891357421875,
86
- "count": 973
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
  },
88
  "SoccerTwos.Environment.CumulativeReward.mean": {
89
  "value": 0.0,
90
  "min": 0.0,
91
  "max": 0.0,
92
- "count": 973
93
  },
94
  "SoccerTwos.Environment.CumulativeReward.sum": {
95
  "value": 0.0,
96
  "min": 0.0,
97
  "max": 0.0,
98
- "count": 973
99
  },
100
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
101
- "value": -0.05570971488952637,
102
- "min": -0.37514444523387486,
103
- "max": 0.24607526935556884,
104
- "count": 973
105
  },
106
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
107
- "value": -9.749200105667114,
108
- "min": -67.52600014209747,
109
- "max": 45.7700001001358,
110
- "count": 973
 
 
 
 
 
 
 
 
 
 
 
 
111
  },
112
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
113
- "value": -0.05570971488952637,
114
- "min": -0.37514444523387486,
115
- "max": 0.24607526935556884,
116
- "count": 973
117
  },
118
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
119
- "value": -9.749200105667114,
120
- "min": -67.52600014209747,
121
- "max": 45.7700001001358,
122
- "count": 973
 
 
 
 
 
 
 
 
 
 
 
 
123
  },
124
  "SoccerTwos.Losses.PolicyLoss.mean": {
125
- "value": 0.012733476008288563,
126
- "min": 0.011228136497666128,
127
- "max": 0.013726944572093391,
128
- "count": 47
129
  },
130
  "SoccerTwos.Losses.PolicyLoss.sum": {
131
- "value": 0.012733476008288563,
132
- "min": 0.011228136497666128,
133
- "max": 0.013726944572093391,
134
- "count": 47
135
  },
136
  "SoccerTwos.Losses.ValueLoss.mean": {
137
- "value": 0.12843565613031388,
138
- "min": 0.11572077537576357,
139
- "max": 0.12922100678086282,
140
- "count": 47
141
  },
142
  "SoccerTwos.Losses.ValueLoss.sum": {
143
- "value": 0.12843565613031388,
144
- "min": 0.11572077537576357,
145
- "max": 0.12922100678086282,
146
- "count": 47
147
  },
148
  "SoccerTwos.Losses.BaselineLoss.mean": {
149
- "value": 0.12908015037576356,
150
- "min": 0.11725246061881384,
151
- "max": 0.12977993567784626,
152
- "count": 47
153
  },
154
  "SoccerTwos.Losses.BaselineLoss.sum": {
155
- "value": 0.12908015037576356,
156
- "min": 0.11725246061881384,
157
- "max": 0.12977993567784626,
158
- "count": 47
159
  },
160
  "SoccerTwos.Policy.LearningRate.mean": {
161
- "value": 1.6292574569173326e-05,
162
- "min": 1.6292574569173326e-05,
163
- "max": 0.00011054928315026,
164
- "count": 47
165
  },
166
  "SoccerTwos.Policy.LearningRate.sum": {
167
- "value": 1.6292574569173326e-05,
168
- "min": 1.6292574569173326e-05,
169
- "max": 0.00011054928315026,
170
- "count": 47
171
  },
172
  "SoccerTwos.Policy.Epsilon.mean": {
173
- "value": 0.10543082666666669,
174
- "min": 0.10543082666666669,
175
- "max": 0.13684974,
176
- "count": 47
177
  },
178
  "SoccerTwos.Policy.Epsilon.sum": {
179
- "value": 0.10543082666666669,
180
- "min": 0.10543082666666669,
181
- "max": 0.13684974,
182
- "count": 47
183
  },
184
  "SoccerTwos.Policy.Beta.mean": {
185
- "value": 0.00028099825066666665,
186
- "min": 0.00028099825066666665,
187
- "max": 0.001848802026,
188
- "count": 47
189
  },
190
  "SoccerTwos.Policy.Beta.sum": {
191
- "value": 0.00028099825066666665,
192
- "min": 0.00028099825066666665,
193
- "max": 0.001848802026,
194
- "count": 47
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
195
  }
196
  },
197
  "metadata": {
198
  "timer_format_version": "0.1.0",
199
- "start_time_seconds": "1680129716",
200
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:39:03) \n[GCC 11.3.0]",
201
  "command_line_arguments": "/home/ringo/mambaforge/envs/hfrl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos5 --no-graphics --resume",
202
  "mlagents_version": "0.31.0.dev0",
@@ -204,59 +264,59 @@
204
  "communication_protocol_version": "1.5.0",
205
  "pytorch_version": "1.11.0+cu102",
206
  "numpy_version": "1.21.2",
207
- "end_time_seconds": "1680172438"
208
  },
209
- "total": 42722.574667928,
210
  "count": 1,
211
- "self": 0.0759030100016389,
212
  "children": {
213
  "run_training.setup": {
214
- "total": 0.025251507002394646,
215
  "count": 1,
216
- "self": 0.025251507002394646
217
  },
218
  "TrainerController.start_learning": {
219
- "total": 42722.473513410994,
220
  "count": 1,
221
- "self": 19.858428147112136,
222
  "children": {
223
  "TrainerController._reset_env": {
224
- "total": 2.5805474780063378,
225
- "count": 40,
226
- "self": 2.5805474780063378
227
  },
228
  "TrainerController.advance": {
229
- "total": 42699.72945140685,
230
- "count": 679082,
231
- "self": 23.77234519814374,
232
  "children": {
233
  "env_step": {
234
- "total": 15710.199912431635,
235
- "count": 679082,
236
- "self": 12746.711335640968,
237
  "children": {
238
  "SubprocessEnvManager._take_step": {
239
- "total": 2952.1668921852106,
240
- "count": 679082,
241
- "self": 136.18300451725372,
242
  "children": {
243
  "TorchPolicy.evaluate": {
244
- "total": 2815.983887667957,
245
- "count": 1220900,
246
- "self": 2815.983887667957
247
  }
248
  }
249
  },
250
  "workers": {
251
- "total": 11.32168460545654,
252
- "count": 679081,
253
  "self": 0.0,
254
  "children": {
255
  "worker_root": {
256
- "total": 42684.878815808435,
257
- "count": 679081,
258
  "is_parallel": true,
259
- "self": 32150.423927959564,
260
  "children": {
261
  "run_training.setup": {
262
  "total": 0.0,
@@ -265,48 +325,48 @@
265
  "self": 0.0,
266
  "children": {
267
  "steps_from_proto": {
268
- "total": 0.0065970009891316295,
269
  "count": 2,
270
  "is_parallel": true,
271
- "self": 0.001290915985009633,
272
  "children": {
273
  "_process_rank_one_or_two_observation": {
274
- "total": 0.0053060850041219965,
275
  "count": 8,
276
  "is_parallel": true,
277
- "self": 0.0053060850041219965
278
  }
279
  }
280
  },
281
  "UnityEnvironment.step": {
282
- "total": 0.10075123800197616,
283
  "count": 1,
284
  "is_parallel": true,
285
- "self": 0.0012871539947809651,
286
  "children": {
287
  "UnityEnvironment._generate_step_input": {
288
- "total": 0.0007557589997304603,
289
  "count": 1,
290
  "is_parallel": true,
291
- "self": 0.0007557589997304603
292
  },
293
  "communicator.exchange": {
294
- "total": 0.0864543719944777,
295
  "count": 1,
296
  "is_parallel": true,
297
- "self": 0.0864543719944777
298
  },
299
  "steps_from_proto": {
300
- "total": 0.01225395301298704,
301
  "count": 2,
302
  "is_parallel": true,
303
- "self": 0.007683153031393886,
304
  "children": {
305
  "_process_rank_one_or_two_observation": {
306
- "total": 0.004570799981593154,
307
  "count": 8,
308
  "is_parallel": true,
309
- "self": 0.004570799981593154
310
  }
311
  }
312
  }
@@ -315,48 +375,48 @@
315
  }
316
  },
317
  "steps_from_proto": {
318
- "total": 0.10548005497548729,
319
- "count": 78,
320
  "is_parallel": true,
321
- "self": 0.019453318280284293,
322
  "children": {
323
  "_process_rank_one_or_two_observation": {
324
- "total": 0.086026736695203,
325
- "count": 312,
326
  "is_parallel": true,
327
- "self": 0.086026736695203
328
  }
329
  }
330
  },
331
  "UnityEnvironment.step": {
332
- "total": 10534.349407793896,
333
- "count": 679080,
334
  "is_parallel": true,
335
- "self": 671.891442082604,
336
  "children": {
337
  "UnityEnvironment._generate_step_input": {
338
- "total": 436.96546818055504,
339
- "count": 679080,
340
  "is_parallel": true,
341
- "self": 436.96546818055504
342
  },
343
  "communicator.exchange": {
344
- "total": 7533.343012046884,
345
- "count": 679080,
346
  "is_parallel": true,
347
- "self": 7533.343012046884
348
  },
349
  "steps_from_proto": {
350
- "total": 1892.149485483853,
351
- "count": 1358160,
352
  "is_parallel": true,
353
- "self": 372.890244903494,
354
  "children": {
355
  "_process_rank_one_or_two_observation": {
356
- "total": 1519.259240580359,
357
- "count": 5432640,
358
  "is_parallel": true,
359
- "self": 1519.259240580359
360
  }
361
  }
362
  }
@@ -369,31 +429,31 @@
369
  }
370
  },
371
  "trainer_advance": {
372
- "total": 26965.75719377707,
373
- "count": 679081,
374
- "self": 128.03335191983206,
375
  "children": {
376
  "process_trajectory": {
377
- "total": 3997.3622430362157,
378
- "count": 679081,
379
- "self": 3991.13507309719,
380
  "children": {
381
  "RLTrainer._checkpoint": {
382
- "total": 6.227169939025771,
383
- "count": 19,
384
- "self": 6.227169939025771
385
  }
386
  }
387
  },
388
  "_update_policy": {
389
- "total": 22840.361598821022,
390
- "count": 47,
391
- "self": 1953.111261621816,
392
  "children": {
393
  "TorchPOCAOptimizer.update": {
394
- "total": 20887.250337199206,
395
- "count": 7050,
396
- "self": 20887.250337199206
397
  }
398
  }
399
  }
@@ -402,19 +462,19 @@
402
  }
403
  },
404
  "trainer_threads": {
405
- "total": 8.970091585069895e-07,
406
  "count": 1,
407
- "self": 8.970091585069895e-07
408
  },
409
  "TrainerController._save_models": {
410
- "total": 0.30508548201760277,
411
  "count": 1,
412
- "self": 0.0037372090155258775,
413
  "children": {
414
  "RLTrainer._checkpoint": {
415
- "total": 0.3013482730020769,
416
  "count": 1,
417
- "self": 0.3013482730020769
418
  }
419
  }
420
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SoccerTwos.Policy.Entropy.mean": {
5
+ "value": 1.6544617414474487,
6
+ "min": 1.6383187770843506,
7
+ "max": 1.771085500717163,
8
+ "count": 517
9
  },
10
  "SoccerTwos.Policy.Entropy.sum": {
11
+ "value": 32295.09375,
12
+ "min": 10663.513671875,
13
+ "max": 39872.62890625,
14
+ "count": 517
15
  },
16
  "SoccerTwos.Environment.EpisodeLength.mean": {
17
+ "value": 52.989010989010985,
18
+ "min": 36.21212121212121,
19
+ "max": 75.50769230769231,
20
+ "count": 517
21
  },
22
  "SoccerTwos.Environment.EpisodeLength.sum": {
23
+ "value": 19288.0,
24
+ "min": 4780.0,
25
+ "max": 20732.0,
26
+ "count": 517
27
  },
28
  "SoccerTwos.Self-play.ELO.mean": {
29
+ "value": 1783.9345993395016,
30
+ "min": 1739.4789078559804,
31
+ "max": 1819.578822229663,
32
+ "count": 517
33
  },
34
  "SoccerTwos.Self-play.ELO.sum": {
35
+ "value": 324676.09707978927,
36
+ "min": 115798.43448098522,
37
+ "max": 439690.6603627888,
38
+ "count": 517
 
 
 
 
 
 
 
 
 
 
 
 
39
  },
40
  "SoccerTwos.Step.mean": {
41
+ "value": 33639986.0,
42
+ "min": 28479978.0,
43
+ "max": 33639986.0,
44
+ "count": 517
45
  },
46
  "SoccerTwos.Step.sum": {
47
+ "value": 33639986.0,
48
+ "min": 28479978.0,
49
+ "max": 33639986.0,
50
+ "count": 517
51
  },
52
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
53
+ "value": -0.018630528822541237,
54
+ "min": -0.11188879609107971,
55
+ "max": 0.07426375895738602,
56
+ "count": 517
57
  },
58
  "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
59
+ "value": -3.390756130218506,
60
+ "min": -21.461830139160156,
61
+ "max": 13.765193939208984,
62
+ "count": 517
63
  },
64
  "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
65
+ "value": -0.018748609349131584,
66
+ "min": -0.10551068186759949,
67
+ "max": 0.07412952184677124,
68
+ "count": 517
69
  },
70
  "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
71
+ "value": -3.4122469425201416,
72
+ "min": -20.84265899658203,
73
+ "max": 14.455087661743164,
74
+ "count": 517
75
+ },
76
+ "SoccerTwos.Policy.CuriosityBaselineEstimate.mean": {
77
+ "value": 0.006533732172101736,
78
+ "min": 0.006031353026628494,
79
+ "max": 0.09678366780281067,
80
+ "count": 517
81
+ },
82
+ "SoccerTwos.Policy.CuriosityBaselineEstimate.sum": {
83
+ "value": 1.1891392469406128,
84
+ "min": 0.9304066896438599,
85
+ "max": 20.50408935546875,
86
+ "count": 517
87
+ },
88
+ "SoccerTwos.Policy.CuriosityValueEstimate.mean": {
89
+ "value": 0.006480127107352018,
90
+ "min": 0.005918653681874275,
91
+ "max": 0.09726906567811966,
92
+ "count": 517
93
+ },
94
+ "SoccerTwos.Policy.CuriosityValueEstimate.sum": {
95
+ "value": 1.1793831586837769,
96
+ "min": 0.913135290145874,
97
+ "max": 20.615158081054688,
98
+ "count": 517
99
  },
100
  "SoccerTwos.Environment.CumulativeReward.mean": {
101
  "value": 0.0,
102
  "min": 0.0,
103
  "max": 0.0,
104
+ "count": 517
105
  },
106
  "SoccerTwos.Environment.CumulativeReward.sum": {
107
  "value": 0.0,
108
  "min": 0.0,
109
  "max": 0.0,
110
+ "count": 517
111
  },
112
  "SoccerTwos.Policy.ExtrinsicReward.mean": {
113
+ "value": -0.07899780391336797,
114
+ "min": -0.32739889358288676,
115
+ "max": 0.33040844974383504,
116
+ "count": 517
117
  },
118
  "SoccerTwos.Policy.ExtrinsicReward.sum": {
119
+ "value": -14.377600312232971,
120
+ "min": -59.2591997385025,
121
+ "max": 47.84479957818985,
122
+ "count": 517
123
+ },
124
+ "SoccerTwos.Policy.CuriosityReward.mean": {
125
+ "value": 0.03525229465794637,
126
+ "min": 0.0,
127
+ "max": 0.24388014633286667,
128
+ "count": 517
129
+ },
130
+ "SoccerTwos.Policy.CuriosityReward.sum": {
131
+ "value": 6.415917627746239,
132
+ "min": 0.0,
133
+ "max": 36.89434967190027,
134
+ "count": 517
135
  },
136
  "SoccerTwos.Environment.GroupCumulativeReward.mean": {
137
+ "value": -0.07899780391336797,
138
+ "min": -0.32739889358288676,
139
+ "max": 0.33040844974383504,
140
+ "count": 517
141
  },
142
  "SoccerTwos.Environment.GroupCumulativeReward.sum": {
143
+ "value": -14.377600312232971,
144
+ "min": -59.2591997385025,
145
+ "max": 47.84479957818985,
146
+ "count": 517
147
+ },
148
+ "SoccerTwos.IsTraining.mean": {
149
+ "value": 1.0,
150
+ "min": 1.0,
151
+ "max": 1.0,
152
+ "count": 517
153
+ },
154
+ "SoccerTwos.IsTraining.sum": {
155
+ "value": 1.0,
156
+ "min": 1.0,
157
+ "max": 1.0,
158
+ "count": 517
159
  },
160
  "SoccerTwos.Losses.PolicyLoss.mean": {
161
+ "value": 0.01082317113565902,
162
+ "min": 0.010641817656190445,
163
+ "max": 0.013228910765095254,
164
+ "count": 25
165
  },
166
  "SoccerTwos.Losses.PolicyLoss.sum": {
167
+ "value": 0.01082317113565902,
168
+ "min": 0.010641817656190445,
169
+ "max": 0.013228910765095254,
170
+ "count": 25
171
  },
172
  "SoccerTwos.Losses.ValueLoss.mean": {
173
+ "value": 0.0611632056782643,
174
+ "min": 0.058945538699626925,
175
+ "max": 0.06389266346891721,
176
+ "count": 25
177
  },
178
  "SoccerTwos.Losses.ValueLoss.sum": {
179
+ "value": 0.0611632056782643,
180
+ "min": 0.058945538699626925,
181
+ "max": 0.06389266346891721,
182
+ "count": 25
183
  },
184
  "SoccerTwos.Losses.BaselineLoss.mean": {
185
+ "value": 0.06231740226348241,
186
+ "min": 0.06012462628384431,
187
+ "max": 0.06539666548371315,
188
+ "count": 25
189
  },
190
  "SoccerTwos.Losses.BaselineLoss.sum": {
191
+ "value": 0.06231740226348241,
192
+ "min": 0.06012462628384431,
193
+ "max": 0.06539666548371315,
194
+ "count": 25
195
  },
196
  "SoccerTwos.Policy.LearningRate.mean": {
197
+ "value": 0.0001879993440002311,
198
+ "min": 0.0001879993440002311,
199
+ "max": 0.00020439037186988668,
200
+ "count": 25
201
  },
202
  "SoccerTwos.Policy.LearningRate.sum": {
203
+ "value": 0.0001879993440002311,
204
+ "min": 0.0001879993440002311,
205
+ "max": 0.00020439037186988668,
206
+ "count": 25
207
  },
208
  "SoccerTwos.Policy.Epsilon.mean": {
209
+ "value": 0.16266643555555557,
210
+ "min": 0.16266643555555557,
211
+ "max": 0.1681301133333333,
212
+ "count": 25
213
  },
214
  "SoccerTwos.Policy.Epsilon.sum": {
215
+ "value": 0.16266643555555557,
216
+ "min": 0.16266643555555557,
217
+ "max": 0.1681301133333333,
218
+ "count": 25
219
  },
220
  "SoccerTwos.Policy.Beta.mean": {
221
+ "value": 0.003137055134222223,
222
+ "min": 0.003137055134222223,
223
+ "max": 0.003409692655333334,
224
+ "count": 25
225
  },
226
  "SoccerTwos.Policy.Beta.sum": {
227
+ "value": 0.003137055134222223,
228
+ "min": 0.003137055134222223,
229
+ "max": 0.003409692655333334,
230
+ "count": 25
231
+ },
232
+ "SoccerTwos.Losses.CuriosityForwardLoss.mean": {
233
+ "value": 0.06363795998195808,
234
+ "min": 0.06363795998195808,
235
+ "max": 0.4287375779946645,
236
+ "count": 25
237
+ },
238
+ "SoccerTwos.Losses.CuriosityForwardLoss.sum": {
239
+ "value": 0.06363795998195808,
240
+ "min": 0.06363795998195808,
241
+ "max": 0.4287375779946645,
242
+ "count": 25
243
+ },
244
+ "SoccerTwos.Losses.CuriosityInverseLoss.mean": {
245
+ "value": 1.1895974318186442,
246
+ "min": 1.1853395628929138,
247
+ "max": 2.4184607744216917,
248
+ "count": 25
249
+ },
250
+ "SoccerTwos.Losses.CuriosityInverseLoss.sum": {
251
+ "value": 1.1895974318186442,
252
+ "min": 1.1853395628929138,
253
+ "max": 2.4184607744216917,
254
+ "count": 25
255
  }
256
  },
257
  "metadata": {
258
  "timer_format_version": "0.1.0",
259
+ "start_time_seconds": "1680172554",
260
  "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:39:03) \n[GCC 11.3.0]",
261
  "command_line_arguments": "/home/ringo/mambaforge/envs/hfrl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=SoccerTwos5 --no-graphics --resume",
262
  "mlagents_version": "0.31.0.dev0",
 
264
  "communication_protocol_version": "1.5.0",
265
  "pytorch_version": "1.11.0+cu102",
266
  "numpy_version": "1.21.2",
267
+ "end_time_seconds": "1680191712"
268
  },
269
+ "total": 19158.371048654983,
270
  "count": 1,
271
+ "self": 0.06926428701262921,
272
  "children": {
273
  "run_training.setup": {
274
+ "total": 0.012148113979492337,
275
  "count": 1,
276
+ "self": 0.012148113979492337
277
  },
278
  "TrainerController.start_learning": {
279
+ "total": 19158.28963625399,
280
  "count": 1,
281
+ "self": 8.16942810654291,
282
  "children": {
283
  "TrainerController._reset_env": {
284
+ "total": 1.2355314569722395,
285
+ "count": 22,
286
+ "self": 1.2355314569722395
287
  },
288
  "TrainerController.advance": {
289
+ "total": 19147.71053276246,
290
+ "count": 361257,
291
+ "self": 8.56901838304475,
292
  "children": {
293
  "env_step": {
294
+ "total": 6734.64510125207,
295
+ "count": 361257,
296
+ "self": 5508.992406987061,
297
  "children": {
298
  "SubprocessEnvManager._take_step": {
299
+ "total": 1220.7081321968872,
300
+ "count": 361257,
301
+ "self": 53.134995022497606,
302
  "children": {
303
  "TorchPolicy.evaluate": {
304
+ "total": 1167.5731371743896,
305
+ "count": 647900,
306
+ "self": 1167.5731371743896
307
  }
308
  }
309
  },
310
  "workers": {
311
+ "total": 4.944562068121741,
312
+ "count": 361257,
313
  "self": 0.0,
314
  "children": {
315
  "worker_root": {
316
+ "total": 19140.3656414171,
317
+ "count": 361257,
318
  "is_parallel": true,
319
+ "self": 14556.282447089936,
320
  "children": {
321
  "run_training.setup": {
322
  "total": 0.0,
 
325
  "self": 0.0,
326
  "children": {
327
  "steps_from_proto": {
328
+ "total": 0.002159021998522803,
329
  "count": 2,
330
  "is_parallel": true,
331
+ "self": 0.0005102219292894006,
332
  "children": {
333
  "_process_rank_one_or_two_observation": {
334
+ "total": 0.0016488000692334026,
335
  "count": 8,
336
  "is_parallel": true,
337
+ "self": 0.0016488000692334026
338
  }
339
  }
340
  },
341
  "UnityEnvironment.step": {
342
+ "total": 0.03421102600987069,
343
  "count": 1,
344
  "is_parallel": true,
345
+ "self": 0.0008790829742792994,
346
  "children": {
347
  "UnityEnvironment._generate_step_input": {
348
+ "total": 0.0006237560010049492,
349
  "count": 1,
350
  "is_parallel": true,
351
+ "self": 0.0006237560010049492
352
  },
353
  "communicator.exchange": {
354
+ "total": 0.029803024022839963,
355
  "count": 1,
356
  "is_parallel": true,
357
+ "self": 0.029803024022839963
358
  },
359
  "steps_from_proto": {
360
+ "total": 0.002905163011746481,
361
  "count": 2,
362
  "is_parallel": true,
363
+ "self": 0.0005354399618227035,
364
  "children": {
365
  "_process_rank_one_or_two_observation": {
366
+ "total": 0.0023697230499237776,
367
  "count": 8,
368
  "is_parallel": true,
369
+ "self": 0.0023697230499237776
370
  }
371
  }
372
  }
 
375
  }
376
  },
377
  "steps_from_proto": {
378
+ "total": 0.04302037303568795,
379
+ "count": 42,
380
  "is_parallel": true,
381
+ "self": 0.007955353416036814,
382
  "children": {
383
  "_process_rank_one_or_two_observation": {
384
+ "total": 0.03506501961965114,
385
+ "count": 168,
386
  "is_parallel": true,
387
+ "self": 0.03506501961965114
388
  }
389
  }
390
  },
391
  "UnityEnvironment.step": {
392
+ "total": 4584.040173954127,
393
+ "count": 361256,
394
  "is_parallel": true,
395
+ "self": 294.0414173450845,
396
  "children": {
397
  "UnityEnvironment._generate_step_input": {
398
+ "total": 205.20476716093253,
399
+ "count": 361256,
400
  "is_parallel": true,
401
+ "self": 205.20476716093253
402
  },
403
  "communicator.exchange": {
404
+ "total": 3238.665957780555,
405
+ "count": 361256,
406
  "is_parallel": true,
407
+ "self": 3238.665957780555
408
  },
409
  "steps_from_proto": {
410
+ "total": 846.1280316675548,
411
+ "count": 722512,
412
  "is_parallel": true,
413
+ "self": 159.79457659239415,
414
  "children": {
415
  "_process_rank_one_or_two_observation": {
416
+ "total": 686.3334550751606,
417
+ "count": 2890048,
418
  "is_parallel": true,
419
+ "self": 686.3334550751606
420
  }
421
  }
422
  }
 
429
  }
430
  },
431
  "trainer_advance": {
432
+ "total": 12404.496413127345,
433
+ "count": 361257,
434
+ "self": 50.02537562244106,
435
  "children": {
436
  "process_trajectory": {
437
+ "total": 1759.4455397337733,
438
+ "count": 361257,
439
+ "self": 1757.0021228148253,
440
  "children": {
441
  "RLTrainer._checkpoint": {
442
+ "total": 2.44341691894806,
443
+ "count": 11,
444
+ "self": 2.44341691894806
445
  }
446
  }
447
  },
448
  "_update_policy": {
449
+ "total": 10595.02549777113,
450
+ "count": 25,
451
+ "self": 1625.9843534287647,
452
  "children": {
453
  "TorchPOCAOptimizer.update": {
454
+ "total": 8969.041144342365,
455
+ "count": 3750,
456
+ "self": 8969.041144342365
457
  }
458
  }
459
  }
 
462
  }
463
  },
464
  "trainer_threads": {
465
+ "total": 2.4730106815695763e-06,
466
  "count": 1,
467
+ "self": 2.4730106815695763e-06
468
  },
469
  "TrainerController._save_models": {
470
+ "total": 1.1741414550051559,
471
  "count": 1,
472
+ "self": 0.006163765996461734,
473
  "children": {
474
  "RLTrainer._checkpoint": {
475
+ "total": 1.1679776890086941,
476
  "count": 1,
477
+ "self": 1.1679776890086941
478
  }
479
  }
480
  }
run_logs/training_status.json CHANGED
@@ -2,59 +2,59 @@
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
- "steps": 26499995,
6
- "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-26499995.onnx",
7
  "reward": 0.0,
8
- "creation_time": 1680163679.061089,
9
  "auxillary_file_paths": [
10
- "results/SoccerTwos5/SoccerTwos/SoccerTwos-26499995.pt"
11
  ]
12
  },
13
  {
14
- "steps": 26999977,
15
- "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-26999977.onnx",
16
  "reward": 0.0,
17
- "creation_time": 1680166516.4965715,
18
  "auxillary_file_paths": [
19
- "results/SoccerTwos5/SoccerTwos/SoccerTwos-26999977.pt"
20
  ]
21
  },
22
  {
23
- "steps": 27499864,
24
- "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-27499864.onnx",
25
  "reward": 0.0,
26
- "creation_time": 1680168793.6688595,
27
  "auxillary_file_paths": [
28
- "results/SoccerTwos5/SoccerTwos/SoccerTwos-27499864.pt"
29
  ]
30
  },
31
  {
32
- "steps": 27999982,
33
- "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-27999982.onnx",
34
  "reward": 0.0,
35
- "creation_time": 1680170873.503431,
36
  "auxillary_file_paths": [
37
- "results/SoccerTwos5/SoccerTwos/SoccerTwos-27999982.pt"
38
  ]
39
  },
40
  {
41
- "steps": 28477740,
42
- "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-28477740.onnx",
43
  "reward": 0.0,
44
- "creation_time": 1680172438.7580104,
45
  "auxillary_file_paths": [
46
- "results/SoccerTwos5/SoccerTwos/SoccerTwos-28477740.pt"
47
  ]
48
  }
49
  ],
50
- "elo": 1755.2629314981316,
51
  "final_checkpoint": {
52
- "steps": 28477740,
53
  "file_path": "results/SoccerTwos5/SoccerTwos.onnx",
54
  "reward": 0.0,
55
- "creation_time": 1680172438.7580104,
56
  "auxillary_file_paths": [
57
- "results/SoccerTwos5/SoccerTwos/SoccerTwos-28477740.pt"
58
  ]
59
  }
60
  },
 
2
  "SoccerTwos": {
3
  "checkpoints": [
4
  {
5
+ "steps": 31999878,
6
+ "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-31999878.onnx",
7
  "reward": 0.0,
8
+ "creation_time": 1680185500.9602473,
9
  "auxillary_file_paths": [
10
+ "results/SoccerTwos5/SoccerTwos/SoccerTwos-31999878.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 32499928,
15
+ "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-32499928.onnx",
16
  "reward": 0.0,
17
+ "creation_time": 1680187156.8123388,
18
  "auxillary_file_paths": [
19
+ "results/SoccerTwos5/SoccerTwos/SoccerTwos-32499928.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 32999999,
24
+ "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-32999999.onnx",
25
  "reward": 0.0,
26
+ "creation_time": 1680189217.7823765,
27
  "auxillary_file_paths": [
28
+ "results/SoccerTwos5/SoccerTwos/SoccerTwos-32999999.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 33499982,
33
+ "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-33499982.onnx",
34
  "reward": 0.0,
35
+ "creation_time": 1680190866.9587436,
36
  "auxillary_file_paths": [
37
+ "results/SoccerTwos5/SoccerTwos/SoccerTwos-33499982.pt"
38
  ]
39
  },
40
  {
41
+ "steps": 33646596,
42
+ "file_path": "results/SoccerTwos5/SoccerTwos/SoccerTwos-33646596.onnx",
43
  "reward": 0.0,
44
+ "creation_time": 1680191712.6597888,
45
  "auxillary_file_paths": [
46
+ "results/SoccerTwos5/SoccerTwos/SoccerTwos-33646596.pt"
47
  ]
48
  }
49
  ],
50
+ "elo": 1786.6899060684966,
51
  "final_checkpoint": {
52
+ "steps": 33646596,
53
  "file_path": "results/SoccerTwos5/SoccerTwos.onnx",
54
  "reward": 0.0,
55
+ "creation_time": 1680191712.6597888,
56
  "auxillary_file_paths": [
57
+ "results/SoccerTwos5/SoccerTwos/SoccerTwos-33646596.pt"
58
  ]
59
  }
60
  },