voyzan committed on Sep 8, 2023

Commit

c28610d

•

1 Parent(s): e9bfd24

2

Browse files

Files changed (18) hide show

SnowballTarget.onnx +1 -1
SnowballTarget/SnowballTarget-149984.onnx +3 -0
SnowballTarget/SnowballTarget-149984.pt +3 -0
SnowballTarget/SnowballTarget-199984.onnx +3 -0
SnowballTarget/SnowballTarget-199984.pt +3 -0
SnowballTarget/SnowballTarget-200112.onnx +3 -0
SnowballTarget/SnowballTarget-200112.pt +3 -0
SnowballTarget/SnowballTarget-49936.onnx +3 -0
SnowballTarget/SnowballTarget-49936.pt +3 -0
SnowballTarget/SnowballTarget-99960.onnx +3 -0
SnowballTarget/SnowballTarget-99960.pt +3 -0
SnowballTarget/checkpoint.pt +1 -1
SnowballTarget/events.out.tfevents.1694195608.928acc295e7e.7575.0 +3 -0
config.json +1 -1
configuration.yaml +2 -2
run_logs/Player-0.log +13 -16
run_logs/timers.json +166 -158
run_logs/training_status.json +46 -10

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5edb4f53411dd7fb34a5fd60ccc6b42988727d6faea2e6ae1a014b2b9c034712
 size 326963

 version https://git-lfs.github.com/spec/v1
+oid sha256:bc1db10ba95558b18d2cd408b03b1cd9337223a534e3ceb1f1d10f0bc442d5e5
 size 326963

SnowballTarget/SnowballTarget-149984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c70e5d048019add6698441063e43910f041071142a3bb4222810f1af8b7ec321
+size 326963

SnowballTarget/SnowballTarget-149984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb0f22094fb05e1ec05f155c2aaba5b2439e2d1424a9e74e942521c3c66ac725
+size 1938524

SnowballTarget/SnowballTarget-199984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc1db10ba95558b18d2cd408b03b1cd9337223a534e3ceb1f1d10f0bc442d5e5
+size 326963

SnowballTarget/SnowballTarget-199984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:75826463ed21e9ff95f52126931f04d7ee672e75089d7153be85cab8fc05c75c
+size 1938524

SnowballTarget/SnowballTarget-200112.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc1db10ba95558b18d2cd408b03b1cd9337223a534e3ceb1f1d10f0bc442d5e5
+size 326963

SnowballTarget/SnowballTarget-200112.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc56d3fb4ef72e5649488db05eabc96b042a2bae13a4ce682ede131e06895362
+size 1938524

SnowballTarget/SnowballTarget-49936.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d0c775894399684c28722f0ddd77848f24c793715c7afa6763213fff7bc25775
+size 326963

SnowballTarget/SnowballTarget-49936.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6b49154f4bbaae0c0c4a1cbc54e1531a1dc8522e55435139f8c4990e33a00e0
+size 1938524

SnowballTarget/SnowballTarget-99960.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a851c2c735210278f6b1a9a566f066e9fe9485fc36ee9e821910926a8bbe7c9b
+size 326963

SnowballTarget/SnowballTarget-99960.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99c144ffbe8145e577c5c9fbdfa493427ff8fe6e401f1d4ceebf439e42ec0d0d
+size 1938524

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:492c3e3682251f7eb2f60e31854f3cb9bd4678e7d230f74d91cc7f571f440c39
 size 1938524

 version https://git-lfs.github.com/spec/v1
+oid sha256:cc56d3fb4ef72e5649488db05eabc96b042a2bae13a4ce682ede131e06895362
 size 1938524

SnowballTarget/events.out.tfevents.1694195608.928acc295e7e.7575.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f0b24ae30951e2705e05b12ea5ad7d5e9c577b63543fbc1ffd9c22f6f11ffad6
+size 28590

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 256, "buffer_size": 4096, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.25, "lambd": 0.93, "num_epoch": 4, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.95, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 10000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 256, "buffer_size": 4096, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.25, "lambd": 0.93, "num_epoch": 4, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.95, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget2", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -38,7 +38,7 @@ behaviors:
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
-    max_steps: 10000
     time_horizon: 64
     summary_freq: 10000
     threaded: true
@@ -64,7 +64,7 @@ engine_settings:
   no_graphics: true
 environment_parameters: null
 checkpoint_settings:
-  run_id: SnowballTarget1
   initialize_from: null
   load_model: false
   resume: false

     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
+    max_steps: 200000
     time_horizon: 64
     summary_freq: 10000
     threaded: true
   no_graphics: true
 environment_parameters: null
 checkpoint_settings:
+  run_id: SnowballTarget2
   initialize_from: null
   load_model: false
   resume: false

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.081 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.642858 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 276 frames, [16.0 KB-32.0 KB]: 4 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,19 +166,19 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 32
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 281 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 5.2 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 281 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 17.8 MB
@@ -213,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 257 frames, [64.0 KB-128.0 KB]: 24 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 66.4 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 281 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 281 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 280 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 281 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 281 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.085 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.626587 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5369 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 41
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 6.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 17.8 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 4613 frames, [64.0 KB-128.0 KB]: 848 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 66.4 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5461 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5460 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,213 +2,213 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 2.8894050121307373,
-            "min": 2.8894050121307373,
-            "max": 2.8894050121307373,
-            "count": 1
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 29653.96484375,
-            "min": 29653.96484375,
-            "max": 29653.96484375,
-            "count": 1
         },
         "SnowballTarget.Step.mean": {
-            "value": 9952.0,
             "min": 9952.0,
-            "max": 9952.0,
-            "count": 1
         },
         "SnowballTarget.Step.sum": {
-            "value": 9952.0,
             "min": 9952.0,
-            "max": 9952.0,
-            "count": 1
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 0.07252310961484909,
-            "min": 0.07252310961484909,
-            "max": 0.07252310961484909,
-            "count": 1
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 14.069483757019043,
-            "min": 14.069483757019043,
-            "max": 14.069483757019043,
-            "count": 1
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
-            "count": 1
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
             "value": 8756.0,
             "min": 8756.0,
-            "max": 8756.0,
-            "count": 1
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 2.5681818181818183,
-            "min": 2.5681818181818183,
-            "max": 2.5681818181818183,
-            "count": 1
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 113.0,
-            "min": 113.0,
-            "max": 113.0,
-            "count": 1
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 2.5681818181818183,
-            "min": 2.5681818181818183,
-            "max": 2.5681818181818183,
-            "count": 1
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 113.0,
-            "min": 113.0,
-            "max": 113.0,
-            "count": 1
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.048945861431712784,
-            "min": 0.048945861431712784,
-            "max": 0.048945861431712784,
-            "count": 1
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.09789172286342557,
-            "min": 0.09789172286342557,
-            "max": 0.09789172286342557,
-            "count": 1
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.047466835674747604,
-            "min": 0.047466835674747604,
-            "max": 0.047466835674747604,
-            "count": 1
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.09493367134949521,
-            "min": 0.09493367134949521,
-            "max": 0.09493367134949521,
-            "count": 1
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 0.00010464006512000002,
-            "min": 0.00010464006512000002,
-            "max": 0.00010464006512000002,
-            "count": 1
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 0.00020928013024000005,
-            "min": 0.00020928013024000005,
-            "max": 0.00020928013024000005,
-            "count": 1
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.15231999999999996,
-            "min": 0.15231999999999996,
-            "max": 0.15231999999999996,
-            "count": 1
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.3046399999999999,
-            "min": 0.3046399999999999,
-            "max": 0.3046399999999999,
-            "count": 1
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0017505119999999999,
-            "min": 0.0017505119999999999,
-            "max": 0.0017505119999999999,
-            "count": 1
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.0035010239999999997,
-            "min": 0.0035010239999999997,
-            "max": 0.0035010239999999997,
-            "count": 1
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 1
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 1
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1694195380",
         "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
-        "end_time_seconds": "1694195409"
     },
-    "total": 29.02839592800001,
     "count": 1,
-    "self": 0.4291761509996377,
     "children": {
         "run_training.setup": {
-            "total": 0.05066195000017615,
             "count": 1,
-            "self": 0.05066195000017615
         },
         "TrainerController.start_learning": {
-            "total": 28.548557827000195,
             "count": 1,
-            "self": 0.04960406900295311,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 4.073276859000089,
                     "count": 1,
-                    "self": 4.073276859000089
                 },
                 "TrainerController.advance": {
-                    "total": 24.27220436799712,
-                    "count": 934,
-                    "self": 0.013697022993483188,
                     "children": {
                         "env_step": {
-                            "total": 24.258507345003636,
-                            "count": 934,
-                            "self": 17.645529235004233,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 6.599235522002118,
-                                    "count": 934,
-                                    "self": 0.0817164420006975,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 6.517519080001421,
-                                            "count": 934,
-                                            "self": 6.517519080001421
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.013742587997285227,
-                                    "count": 934,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 28.340408872997614,
-                                            "count": 934,
                                             "is_parallel": true,
-                                            "self": 15.729059506996236,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0050898710001092695,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0035374720000618254,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0015523990000474441,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0015523990000474441
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.0375554289998945,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0006312569998954132,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00037489600003937085,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00037489600003937085
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.03338095899994187,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.03338095899994187
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0031683170000178507,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00040893699974731135,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0027593800002705393,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0027593800002705393
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 12.611349366001377,
-                                                    "count": 933,
                                                     "is_parallel": true,
-                                                    "self": 0.537294581010201,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 0.27039484499505306,
-                                                            "count": 933,
                                                             "is_parallel": true,
-                                                            "self": 0.27039484499505306
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 9.939632270995617,
-                                                            "count": 933,
                                                             "is_parallel": true,
-                                                            "self": 9.939632270995617
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 1.8640276690005066,
-                                                            "count": 933,
                                                             "is_parallel": true,
-                                                            "self": 0.34912224099684863,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 1.514905428003658,
-                                                                    "count": 9330,
                                                                     "is_parallel": true,
-                                                                    "self": 1.514905428003658
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 0.00023283299992726825,
                     "count": 1,
-                    "self": 0.00023283299992726825,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,28 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 24.048281263001627,
-                                    "count": 29422,
                                     "is_parallel": true,
-                                    "self": 0.644191267008182,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 16.19414100299332,
-                                            "count": 29422,
                                             "is_parallel": true,
-                                            "self": 16.19414100299332
                                         },
                                         "_update_policy": {
-                                            "total": 7.2099489930001255,
-                                            "count": 2,
                                             "is_parallel": true,
-                                            "self": 4.056289224001148,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 3.1536597689989776,
-                                                    "count": 132,
                                                     "is_parallel": true,
-                                                    "self": 3.1536597689989776
                                                 }
                                             }
                                         }
@@ -352,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.15323969800010673,
                     "count": 1,
-                    "self": 0.0006165100000998791,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.15262318800000685,
                             "count": 1,
-                            "self": 0.15262318800000685
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 1.0823804140090942,
+            "min": 1.0823804140090942,
+            "max": 2.8865561485290527,
+            "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 10358.380859375,
+            "min": 10358.380859375,
+            "max": 29624.724609375,
+            "count": 20
         },
         "SnowballTarget.Step.mean": {
+            "value": 199984.0,
             "min": 9952.0,
+            "max": 199984.0,
+            "count": 20
         },
         "SnowballTarget.Step.sum": {
+            "value": 199984.0,
             "min": 9952.0,
+            "max": 199984.0,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 2.567681312561035,
+            "min": 0.09589726477861404,
+            "max": 2.574761390686035,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 500.6978759765625,
+            "min": 18.604068756103516,
+            "max": 525.2513427734375,
+            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
+            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
             "value": 8756.0,
             "min": 8756.0,
+            "max": 10945.0,
+            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 25.15909090909091,
+            "min": 3.272727272727273,
+            "max": 25.386363636363637,
+            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1107.0,
+            "min": 144.0,
+            "max": 1389.0,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 25.15909090909091,
+            "min": 3.272727272727273,
+            "max": 25.386363636363637,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1107.0,
+            "min": 144.0,
+            "max": 1389.0,
+            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.05303531138120246,
+            "min": 0.043000292613321695,
+            "max": 0.05497397439595421,
+            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.10607062276240492,
+            "min": 0.08600058522664339,
+            "max": 0.15276711164316273,
+            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.12043402075548382,
+            "min": 0.05885272711833857,
+            "max": 0.1406230588498361,
+            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.24086804151096763,
+            "min": 0.11770545423667714,
+            "max": 0.4104643968098304,
+            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 6.432097856000006e-06,
+            "min": 6.432097856000006e-06,
+            "max": 0.00029023200325599993,
+            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 1.2864195712000013e-05,
+            "min": 1.2864195712000013e-05,
+            "max": 0.0007419960526679999,
+            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10321600000000003,
+            "min": 0.10321600000000003,
+            "max": 0.24511600000000003,
+            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.20643200000000006,
+            "min": 0.20643200000000006,
+            "max": 0.6709980000000001,
+            "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 0.00011698560000000007,
+            "min": 0.00011698560000000007,
+            "max": 0.004837525599999999,
+            "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.00023397120000000015,
+            "min": 0.00023397120000000015,
+            "max": 0.012371866800000002,
+            "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 20
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 20
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1694195607",
         "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget2 --no-graphics",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
+        "end_time_seconds": "1694196083"
     },
+    "total": 475.86589398,
     "count": 1,
+    "self": 0.43534228899966365,
     "children": {
         "run_training.setup": {
+            "total": 0.03870379100021637,
             "count": 1,
+            "self": 0.03870379100021637
         },
         "TrainerController.start_learning": {
+            "total": 475.39184790000013,
             "count": 1,
+            "self": 0.5261172999864812,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.8278629380001803,
                     "count": 1,
+                    "self": 3.8278629380001803
                 },
                 "TrainerController.advance": {
+                    "total": 470.90342204901344,
+                    "count": 18202,
+                    "self": 0.2622811350365737,
                     "children": {
                         "env_step": {
+                            "total": 470.64114091397687,
+                            "count": 18202,
+                            "self": 348.71422680298383,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 121.66394710200075,
+                                    "count": 18202,
+                                    "self": 1.755945177010517,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 119.90800192499023,
+                                            "count": 18202,
+                                            "self": 119.90800192499023
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.2629670089922911,
+                                    "count": 18202,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 473.8338290559757,
+                                            "count": 18202,
                                             "is_parallel": true,
+                                            "self": 236.80496419895894,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.0018615440001212846,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0005025840000598691,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0013589600000614155,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0013589600000614155
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.03816275599979235,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0006009799997173104,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.00033410600008210167,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00033410600008210167
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.0350276470001063,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0350276470001063
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0022000229998866416,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.000523639999983061,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0016763829999035806,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0016763829999035806
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 237.02886485701674,
+                                                    "count": 18201,
                                                     "is_parallel": true,
+                                                    "self": 10.0921474280849,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.2441317659774995,
+                                                            "count": 18201,
                                                             "is_parallel": true,
+                                                            "self": 5.2441317659774995
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 186.9509997249993,
+                                                            "count": 18201,
                                                             "is_parallel": true,
+                                                            "self": 186.9509997249993
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 34.74158593795505,
+                                                            "count": 18201,
                                                             "is_parallel": true,
+                                                            "self": 6.252948916890773,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 28.488637021064278,
+                                                                    "count": 182010,
                                                                     "is_parallel": true,
+                                                                    "self": 28.488637021064278
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 0.00015687999984947965,
                     "count": 1,
+                    "self": 0.00015687999984947965,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 466.432363791929,
+                                    "count": 526672,
                                     "is_parallel": true,
+                                    "self": 11.80509066705963,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 299.5110636478719,
+                                            "count": 526672,
                                             "is_parallel": true,
+                                            "self": 298.73790789987197,
+                                            "children": {
+                                                "RLTrainer._checkpoint": {
+                                                    "total": 0.7731557479999083,
+                                                    "count": 4,
+                                                    "is_parallel": true,
+                                                    "self": 0.7731557479999083
+                                                }
+                                            }
                                         },
                                         "_update_policy": {
+                                            "total": 155.11620947699748,
+                                            "count": 45,
                                             "is_parallel": true,
+                                            "self": 87.08159226400198,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 68.0346172129955,
+                                                    "count": 3056,
                                                     "is_parallel": true,
+                                                    "self": 68.0346172129955
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.13428873300017585,
                     "count": 1,
+                    "self": 0.0006541750003634661,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.1336345579998124,
                             "count": 1,
+                            "self": 0.1336345579998124
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -2,22 +2,58 @@
     "SnowballTarget": {
         "checkpoints": [
             {
-                "steps": 10208,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-10208.onnx",
-                "reward": 2.5454545454545454,
-                "creation_time": 1694195408.9938948,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-10208.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 10208,
-            "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 2.5454545454545454,
-            "creation_time": 1694195408.9938948,
             "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-10208.pt"
             ]
         }
     },

     "SnowballTarget": {
         "checkpoints": [
             {
+                "steps": 49936,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-49936.onnx",
+                "reward": 12.0,
+                "creation_time": 1694195729.460012,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-49936.pt"
+                ]
+            },
+            {
+                "steps": 99960,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-99960.onnx",
+                "reward": 18.90909090909091,
+                "creation_time": 1694195846.0612614,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-99960.pt"
+                ]
+            },
+            {
+                "steps": 149984,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 25.636363636363637,
+                "creation_time": 1694195964.9191837,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-149984.pt"
+                ]
+            },
+            {
+                "steps": 199984,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-199984.onnx",
+                "reward": 25.545454545454547,
+                "creation_time": 1694196083.1622114,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-199984.pt"
+                ]
+            },
+            {
+                "steps": 200112,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": 25.545454545454547,
+                "creation_time": 1694196083.3159246,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
+            "steps": 200112,
+            "file_path": "results/SnowballTarget2/SnowballTarget.onnx",
+            "reward": 25.545454545454547,
+            "creation_time": 1694196083.3159246,
             "auxillary_file_paths": [
+                "results/SnowballTarget2/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },