xenjin450 committed on Feb 4, 2025

Commit

3686dfb

verified ·

1 Parent(s): bab2d69

First Push

Browse files

Files changed (18) hide show

SnowballTarget.onnx +1 -1
SnowballTarget/SnowballTarget-149984.onnx +1 -1
SnowballTarget/SnowballTarget-149984.pt +1 -1
SnowballTarget/SnowballTarget-199984.onnx +1 -1
SnowballTarget/SnowballTarget-199984.pt +1 -1
SnowballTarget/SnowballTarget-200112.onnx +1 -1
SnowballTarget/SnowballTarget-200112.pt +1 -1
SnowballTarget/SnowballTarget-49936.onnx +1 -1
SnowballTarget/SnowballTarget-49936.pt +1 -1
SnowballTarget/SnowballTarget-99960.onnx +1 -1
SnowballTarget/SnowballTarget-99960.pt +1 -1
SnowballTarget/checkpoint.pt +1 -1
SnowballTarget/events.out.tfevents.1738662695.cf106d47a9e7.27596.0 +3 -0
config.json +1 -1
configuration.yaml +1 -1
run_logs/Player-0.log +15 -18
run_logs/timers.json +114 -114
run_logs/training_status.json +24 -24

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b6b14d913bf1e960102b05e9bd571bb5497370286c413ad4d31f24d2dde58b4
 size 2867524

 version https://git-lfs.github.com/spec/v1
+oid sha256:fba36e777d5bd4ad44c8c47254c42c798ce75ca3ac9be588978bff97f043781e
 size 2867524

SnowballTarget/SnowballTarget-149984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4bd50844df617ded0127cb2adbfe4e7410615eef4a143ebd27b6d0a2cfbdbeca
 size 2867524

 version https://git-lfs.github.com/spec/v1
+oid sha256:c3dd4ddb6c472fc69b3e6993dd975b0d60002586d06d353739137e8994d321df
 size 2867524

SnowballTarget/SnowballTarget-149984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f7786c33bd6395cb90224e3f2252ead95175deab831527f2de41f53b8ef45fb
 size 8602051

 version https://git-lfs.github.com/spec/v1
+oid sha256:63dde6fa5637b4687a830db62b1269e2ec48b920f7151182db24831fa872fbf5
 size 8602051

SnowballTarget/SnowballTarget-199984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b6b14d913bf1e960102b05e9bd571bb5497370286c413ad4d31f24d2dde58b4
 size 2867524

 version https://git-lfs.github.com/spec/v1
+oid sha256:fba36e777d5bd4ad44c8c47254c42c798ce75ca3ac9be588978bff97f043781e
 size 2867524

SnowballTarget/SnowballTarget-199984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:87f937f9b81222cc7c89cd9241a30dd95e6c9cde0f3151cd3c60c545a3e34a77
 size 8602051

 version https://git-lfs.github.com/spec/v1
+oid sha256:8c646be6cfaa197fdfa4ad52e195debbde3114867213876439943d1e01765d0a
 size 8602051

SnowballTarget/SnowballTarget-200112.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1b6b14d913bf1e960102b05e9bd571bb5497370286c413ad4d31f24d2dde58b4
 size 2867524

 version https://git-lfs.github.com/spec/v1
+oid sha256:fba36e777d5bd4ad44c8c47254c42c798ce75ca3ac9be588978bff97f043781e
 size 2867524

SnowballTarget/SnowballTarget-200112.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e6b9cf487035a53140bf51bfb8d99907edfd4ef1c1d5bb6ca490c77467c6b1a
 size 8602051

 version https://git-lfs.github.com/spec/v1
+oid sha256:e245d753fde57345c59e202761bdbd18453720c0bc3663bb8812a04b8b7ec743
 size 8602051

SnowballTarget/SnowballTarget-49936.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e04c4e97a937f7f7313ab074ef2532d68117afcf882c7505790a0ffeaf9240ef
 size 2867524

 version https://git-lfs.github.com/spec/v1
+oid sha256:67cbe5bceadb5985faf275c35e18e8a7b5221008dbb14a4ee987b58b759b8b10
 size 2867524

SnowballTarget/SnowballTarget-49936.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:541471f68df4b0c24c5c8b86ef99f9528e090961010d3536a1ac6a748cc381d3
 size 8601984

 version https://git-lfs.github.com/spec/v1
+oid sha256:6401e587119f53ba2091f01f6f4dfac935adcf7f8a456c28eeb4343e3ea7f659
 size 8601984

SnowballTarget/SnowballTarget-99960.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:76e04cae2c70f630b8ec70956f4db67ccb928afd1d807824467bee8074c4d822
 size 2867524

 version https://git-lfs.github.com/spec/v1
+oid sha256:dde983107ba9f5ae0bc056f3ef52bde092499f8e7b462888d2d7edac01fcefeb
 size 2867524

SnowballTarget/SnowballTarget-99960.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e0d9a36f95dd53a3301fe027639d6a8305515c8848d28cb726590b68a3279f5a
 size 8601984

 version https://git-lfs.github.com/spec/v1
+oid sha256:73b6df79113e429214a74a7a4190337c9165e8870ab74320b872f6c994b79b34
 size 8601984

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2183003596300821515724220666562428395d8c1aea3fb4314701b224402180
 size 8601314

 version https://git-lfs.github.com/spec/v1
+oid sha256:22e5e1e9d7ee1ee37fc2efe51988cea705d385a9b0a9a14f8a93f68f6f205f72
 size 8601314

SnowballTarget/events.out.tfevents.1738662695.cf106d47a9e7.27596.0 ADDED Viewed

@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1aba77e079ad03c2ae3baeef5fc57115ce724749d78911a633acb98c7422aa27
+size 28202

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 512, "buffer_size": 2048, "learning_rate": 0.0004, "beta": 0.005, "epsilon": 0.3, "lambd": 0.95, "num_epoch": 5, "shared_critic": true, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "resnet", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTargetRLXenjin450", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 512, "buffer_size": 2048, "learning_rate": 0.0004, "beta": 0.005, "epsilon": 0.3, "lambd": 0.95, "num_epoch": 5, "shared_critic": true, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "resnet", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTargetXenjin450", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -66,7 +66,7 @@ engine_settings:
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
-  run_id: SnowballTargetRLXenjin450
   initialize_from: null
   load_model: false
   resume: false

   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
+  run_id: SnowballTargetXenjin450
   initialize_from: null
   load_model: false
   resume: false

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.147 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 1.076136 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5371 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,22 +166,22 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 41
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 7.1 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.4 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -213,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5082 frames, [64.0 KB-128.0 KB]: 381 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 66.4 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5463 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5462 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5463 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5463 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.195 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 2.455169 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5370 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 45
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5462 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 6.7 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5462 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.8 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 3911 frames, [64.0 KB-128.0 KB]: 1551 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 67.6 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5462 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5462 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5461 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5462 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5462 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,15 +2,15 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.7426327466964722,
-            "min": 0.731351375579834,
-            "max": 2.87078595161438,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 7115.1640625,
-            "min": 7115.1640625,
-            "max": 29494.455078125,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
@@ -26,15 +26,15 @@
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 13.157102584838867,
-            "min": 0.40423882007598877,
-            "max": 13.203481674194336,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2565.635009765625,
-            "min": 78.42233276367188,
-            "max": 2693.51025390625,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
@@ -50,27 +50,27 @@
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.03378662246068416,
-            "min": 0.024719062141757602,
-            "max": 0.03549714893844794,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.13514648984273664,
-            "min": 0.10262200149154523,
-            "max": 0.17748574469223968,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.20805656611919401,
-            "min": 0.13371476717293262,
-            "max": 0.30642091631889345,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.8322262644767761,
-            "min": 0.5348590686917305,
-            "max": 1.4480631172657012,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
@@ -82,7 +82,7 @@
         "SnowballTarget.Policy.LearningRate.sum": {
             "value": 4.310438922400004e-05,
             "min": 4.310438922400004e-05,
-            "max": 0.0018470080382480003,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
@@ -94,7 +94,7 @@
         "SnowballTarget.Policy.Epsilon.sum": {
             "value": 0.421552,
             "min": 0.421552,
-            "max": 1.423504,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
@@ -106,31 +106,31 @@
         "SnowballTarget.Policy.Beta.sum": {
             "value": 0.0005777224000000006,
             "min": 0.0005777224000000006,
-            "max": 0.0230914248,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 26.0,
-            "min": 3.409090909090909,
-            "max": 26.113636363636363,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1144.0,
-            "min": 150.0,
-            "max": 1424.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 26.0,
-            "min": 3.409090909090909,
-            "max": 26.113636363636363,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1144.0,
-            "min": 150.0,
-            "max": 1424.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
@@ -148,67 +148,67 @@
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1738656550",
         "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowBallTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTargetRLXenjin450 --no-graphics",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.6.0+cu124",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1738657315"
     },
-    "total": 765.3132163070001,
     "count": 1,
-    "self": 0.5930619870000555,
     "children": {
         "run_training.setup": {
-            "total": 0.03710776100001567,
             "count": 1,
-            "self": 0.03710776100001567
         },
         "TrainerController.start_learning": {
-            "total": 764.683046559,
             "count": 1,
-            "self": 0.949189137989606,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 3.585462923000023,
                     "count": 1,
-                    "self": 3.585462923000023
                 },
                 "TrainerController.advance": {
-                    "total": 760.0062615160103,
-                    "count": 18208,
-                    "self": 0.42497787501986295,
                     "children": {
                         "env_step": {
-                            "total": 759.5812836409905,
-                            "count": 18208,
-                            "self": 602.27683737699,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 156.8676528189999,
-                                    "count": 18208,
-                                    "self": 2.4283309699890196,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 154.43932184901087,
-                                            "count": 18208,
-                                            "self": 154.43932184901087
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.43679344500060324,
-                                    "count": 18208,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 762.6161606029825,
-                                            "count": 18208,
                                             "is_parallel": true,
-                                            "self": 438.6304640459622,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.007090471999958936,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.004857103999938772,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.002233368000020164,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.002233368000020164
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.04775891999997839,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0008827899999914735,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00045350200002758356,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00045350200002758356
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.04406474100005653,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.04406474100005653
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.002357886999902803,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0004984689996945235,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0018594180002082794,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0018594180002082794
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 323.98569655702033,
-                                                    "count": 18207,
                                                     "is_parallel": true,
-                                                    "self": 13.650050263036519,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 7.71489115998736,
-                                                            "count": 18207,
                                                             "is_parallel": true,
-                                                            "self": 7.71489115998736
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 259.3493254720022,
-                                                            "count": 18207,
                                                             "is_parallel": true,
-                                                            "self": 259.3493254720022
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 43.27142966199426,
-                                                            "count": 18207,
                                                             "is_parallel": true,
-                                                            "self": 8.577398599008802,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 34.69403106298546,
-                                                                    "count": 182070,
                                                                     "is_parallel": true,
-                                                                    "self": 34.69403106298546
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 0.000221620000047551,
                     "count": 1,
-                    "self": 0.000221620000047551,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,36 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 753.5991227619644,
-                                    "count": 760786,
                                     "is_parallel": true,
-                                    "self": 17.114075343134118,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 338.4741784408303,
-                                            "count": 760786,
                                             "is_parallel": true,
-                                            "self": 337.1586647528302,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 1.3155136880001237,
                                                     "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 1.3155136880001237
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 398.01086897799996,
                                             "count": 90,
                                             "is_parallel": true,
-                                            "self": 97.17286447700337,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 300.8380045009966,
                                                     "count": 1800,
                                                     "is_parallel": true,
-                                                    "self": 300.8380045009966
                                                 }
                                             }
                                         }
@@ -360,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.14191136199997345,
                     "count": 1,
-                    "self": 0.007087764000061725,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.13482359799991173,
                             "count": 1,
-                            "self": 0.13482359799991173
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.6928920745849609,
+            "min": 0.6928920745849609,
+            "max": 2.878577470779419,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 6646.220703125,
+            "min": 6646.220703125,
+            "max": 29574.50390625,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 11.981770515441895,
+            "min": 0.29059553146362305,
+            "max": 11.981770515441895,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2336.4453125,
+            "min": 56.37553405761719,
+            "max": 2440.07568359375,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.0296454241455649,
+            "min": 0.028084085073787724,
+            "max": 0.037452506452100354,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.1185816965822596,
+            "min": 0.1185816965822596,
+            "max": 0.18726253226050177,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.19328838884830474,
+            "min": 0.10373825123533606,
+            "max": 0.290578506141901,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.773153555393219,
+            "min": 0.41495300494134424,
+            "max": 1.3859055444598198,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
         "SnowballTarget.Policy.LearningRate.sum": {
             "value": 4.310438922400004e-05,
             "min": 4.310438922400004e-05,
+            "max": 0.0018468800382800002,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
         "SnowballTarget.Policy.Epsilon.sum": {
             "value": 0.421552,
             "min": 0.421552,
+            "max": 1.42344,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
         "SnowballTarget.Policy.Beta.sum": {
             "value": 0.0005777224000000006,
             "min": 0.0005777224000000006,
+            "max": 0.023089828,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 23.681818181818183,
+            "min": 2.6818181818181817,
+            "max": 23.70909090909091,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1042.0,
+            "min": 118.0,
+            "max": 1304.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 23.681818181818183,
+            "min": 2.6818181818181817,
+            "max": 23.70909090909091,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1042.0,
+            "min": 118.0,
+            "max": 1304.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1738662694",
         "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTargetXenjin450 --no-graphics",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.6.0+cu124",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1738663506"
     },
+    "total": 812.5668383210004,
     "count": 1,
+    "self": 0.6927915620008207,
     "children": {
         "run_training.setup": {
+            "total": 0.03452016699975502,
             "count": 1,
+            "self": 0.03452016699975502
         },
         "TrainerController.start_learning": {
+            "total": 811.8395265919999,
             "count": 1,
+            "self": 1.07995954297985,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.42389432499931,
                     "count": 1,
+                    "self": 3.42389432499931
                 },
                 "TrainerController.advance": {
+                    "total": 807.1814257440201,
+                    "count": 18206,
+                    "self": 0.49803600401173753,
                     "children": {
                         "env_step": {
+                            "total": 806.6833897400084,
+                            "count": 18206,
+                            "self": 640.9386373739844,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 165.25657096709983,
+                                    "count": 18206,
+                                    "self": 2.93720667904563,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 162.3193642880542,
+                                            "count": 18206,
+                                            "self": 162.3193642880542
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.4881813989240982,
+                                    "count": 18206,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 809.5793749020659,
+                                            "count": 18206,
                                             "is_parallel": true,
+                                            "self": 463.8940645060702,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.004620794999937061,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.001583236999977089,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0030375579999599722,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0030375579999599722
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.15677927999968233,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0037805080000907765,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.0004818150000573951,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0004818150000573951
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.13114621299973805,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.13114621299973805
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.021370743999796105,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.005355924999093986,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.01601481900070212,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.01601481900070212
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 345.68531039599566,
+                                                    "count": 18205,
                                                     "is_parallel": true,
+                                                    "self": 14.406276040003831,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 7.994227226001385,
+                                                            "count": 18205,
                                                             "is_parallel": true,
+                                                            "self": 7.994227226001385
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 278.1204304049734,
+                                                            "count": 18205,
                                                             "is_parallel": true,
+                                                            "self": 278.1204304049734
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 45.164376725017064,
+                                                            "count": 18205,
                                                             "is_parallel": true,
+                                                            "self": 9.234507885953462,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 35.9298688390636,
+                                                                    "count": 182050,
                                                                     "is_parallel": true,
+                                                                    "self": 35.9298688390636
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 0.00023182800032373052,
                     "count": 1,
+                    "self": 0.00023182800032373052,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 800.2991470469851,
+                                    "count": 828679,
                                     "is_parallel": true,
+                                    "self": 18.937228551389126,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 362.3103792215943,
+                                            "count": 828679,
                                             "is_parallel": true,
+                                            "self": 360.76179730759395,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 1.5485819140003514,
                                                     "count": 4,
                                                     "is_parallel": true,
+                                                    "self": 1.5485819140003514
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 419.0515392740017,
                                             "count": 90,
                                             "is_parallel": true,
+                                            "self": 98.93746979500156,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 320.11406947900014,
                                                     "count": 1800,
                                                     "is_parallel": true,
+                                                    "self": 320.11406947900014
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.1540151520002837,
                     "count": 1,
+                    "self": 0.004700188000242633,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.14931496400004107,
                             "count": 1,
+                            "self": 0.14931496400004107
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -3,57 +3,57 @@
         "checkpoints": [
             {
                 "steps": 49936,
-                "file_path": "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 18.545454545454547,
-                "creation_time": 1738656745.9923544,
                 "auxillary_file_paths": [
-                    "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             },
             {
                 "steps": 99960,
-                "file_path": "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 25.181818181818183,
-                "creation_time": 1738656933.7699564,
                 "auxillary_file_paths": [
-                    "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             },
             {
                 "steps": 149984,
-                "file_path": "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 26.09090909090909,
-                "creation_time": 1738657127.274378,
                 "auxillary_file_paths": [
-                    "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
                 "steps": 199984,
-                "file_path": "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 26.363636363636363,
-                "creation_time": 1738657315.1212382,
                 "auxillary_file_paths": [
-                    "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
                 "steps": 200112,
-                "file_path": "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-200112.onnx",
-                "reward": 26.363636363636363,
-                "creation_time": 1738657315.280354,
                 "auxillary_file_paths": [
-                    "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
             "steps": 200112,
-            "file_path": "results/SnowballTargetRLXenjin450/SnowballTarget.onnx",
-            "reward": 26.363636363636363,
-            "creation_time": 1738657315.280354,
             "auxillary_file_paths": [
-                "results/SnowballTargetRLXenjin450/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },

         "checkpoints": [
             {
                 "steps": 49936,
+                "file_path": "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-49936.onnx",
+                "reward": 13.636363636363637,
+                "creation_time": 1738662894.4801404,
                 "auxillary_file_paths": [
+                    "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             },
             {
                 "steps": 99960,
+                "file_path": "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-99960.onnx",
+                "reward": 22.727272727272727,
+                "creation_time": 1738663097.372155,
                 "auxillary_file_paths": [
+                    "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             },
             {
                 "steps": 149984,
+                "file_path": "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 24.09090909090909,
+                "creation_time": 1738663302.5231082,
                 "auxillary_file_paths": [
+                    "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
                 "steps": 199984,
+                "file_path": "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-199984.onnx",
+                "reward": 23.90909090909091,
+                "creation_time": 1738663506.0177546,
                 "auxillary_file_paths": [
+                    "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
                 "steps": 200112,
+                "file_path": "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": 23.90909090909091,
+                "creation_time": 1738663506.209956,
                 "auxillary_file_paths": [
+                    "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
             "steps": 200112,
+            "file_path": "results/SnowballTargetXenjin450/SnowballTarget.onnx",
+            "reward": 23.90909090909091,
+            "creation_time": 1738663506.209956,
             "auxillary_file_paths": [
+                "results/SnowballTargetXenjin450/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },