jensenwiedler committed on Jan 4, 2025

Commit

faad574

verified ·

1 Parent(s): 2a7d5f0

second Push

Browse files

Files changed (18) hide show

SnowballTarget.onnx +1 -1
SnowballTarget/SnowballTarget-549976.onnx +3 -0
SnowballTarget/SnowballTarget-549976.pt +3 -0
SnowballTarget/SnowballTarget-599936.onnx +3 -0
SnowballTarget/SnowballTarget-599936.pt +3 -0
SnowballTarget/SnowballTarget-649960.onnx +3 -0
SnowballTarget/SnowballTarget-649960.pt +3 -0
SnowballTarget/SnowballTarget-699960.onnx +3 -0
SnowballTarget/SnowballTarget-699960.pt +3 -0
SnowballTarget/SnowballTarget-700216.onnx +3 -0
SnowballTarget/SnowballTarget-700216.pt +3 -0
SnowballTarget/checkpoint.pt +1 -1
SnowballTarget/events.out.tfevents.1735996792.358412b7f1d5.7231.0 +3 -0
config.json +1 -1
configuration.yaml +2 -2
run_logs/Player-0.log +15 -15
run_logs/timers.json +163 -163
run_logs/training_status.json +49 -49

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:892ed4663f040154610c0c27bd9130771b3ed591703db9df3e2189faa84fad5a
 size 650646

 version https://git-lfs.github.com/spec/v1
+oid sha256:b69b5713932148c7adb707222b68501899ba0abfabdd2aa1f7e8e634ff7a76b3
 size 650646

SnowballTarget/SnowballTarget-549976.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:763f3c90d1ea2173ad1e8346c2902f1bd8ba3bca3b050f0e7f2c120edc9ba04d
+size 650646

SnowballTarget/SnowballTarget-549976.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0cbef37288d8a771abbab0f090b9106e133226b480e46cf2cd65590cb0fce24
+size 3850075

SnowballTarget/SnowballTarget-599936.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91ee899f60a7b2a091715d5dd6765a75e99e5a1d930a6244cd5c6a100585c1e7
+size 650646

SnowballTarget/SnowballTarget-599936.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c436d411c6726b248971025e4aa5280e43f0982b68ecd9d88c628530f696e7be
+size 3850075

SnowballTarget/SnowballTarget-649960.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af897a4d6fab3b15fff12d12ab64098100035b52053bf6d9fe41a0a271c6736d
+size 650646

SnowballTarget/SnowballTarget-649960.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e54d611dc1e30d983999d0b25eb2e76ae481bafb3b0bf4140a73de6054c7f9d
+size 3850075

SnowballTarget/SnowballTarget-699960.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b69b5713932148c7adb707222b68501899ba0abfabdd2aa1f7e8e634ff7a76b3
+size 650646

SnowballTarget/SnowballTarget-699960.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22ea085092fde13684e0a92448a989c323b7f2e672eb46ac179a5a6681ec3e19
+size 3850075

SnowballTarget/SnowballTarget-700216.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b69b5713932148c7adb707222b68501899ba0abfabdd2aa1f7e8e634ff7a76b3
+size 650646

SnowballTarget/SnowballTarget-700216.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9b5d76fb6eb643b312825282fd710ee75c8d7f79eb4635d5e19bc4507f2d8d2
+size 3850075

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5ff7571f7515972757077b49f5ca68bfdcf48c2362cdf55d7ffbeaa9e7062423
 size 3849250

 version https://git-lfs.github.com/spec/v1
+oid sha256:6d6e73e62c0552157b38d2b0afa307cca1fa485ff46f2c555b25fd1007211ad2
 size 3849250

SnowballTarget/events.out.tfevents.1735996792.358412b7f1d5.7231.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:10b3f974537bd9824da4e8e4673eb78f54745ba729906091836d90ebb2884ba0
+size 17436

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 512, "buffer_size": 10240, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 500000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget2", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 512, "buffer_size": 10240, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 700000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget2", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -38,7 +38,7 @@ behaviors:
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
-    max_steps: 500000
     time_horizon: 64
     summary_freq: 10000
     threaded: false
@@ -69,7 +69,7 @@ checkpoint_settings:
   run_id: SnowballTarget2
   initialize_from: null
   load_model: false
-  resume: false
   force: false
   train_model: false
   inference: false

     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
+    max_steps: 700000
     time_horizon: 64
     summary_freq: 10000
     threaded: false
   run_id: SnowballTarget2
   initialize_from: null
   load_model: false
+  resume: true
   force: false
   train_model: false
   inference: false

run_logs/Player-0.log CHANGED Viewed

@@ -31,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.084 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -42,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.600158 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -50,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 13412 frames, [16.0 KB-32.0 KB]: 227 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -166,22 +166,22 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 44
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 12691 frames, [8.0 MB-16.0 MB]: 949 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 9.5 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 13640 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.9 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -210,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 9992 frames, [64.0 KB-128.0 KB]: 3648 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 67.7 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 13640 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -228,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 13640 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 13639 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -246,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 13640 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 13640 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.085 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.690879 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5367 frames, [16.0 KB-32.0 KB]: 90 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 36
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5458 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 6.8 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5458 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.7 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5263 frames, [64.0 KB-128.0 KB]: 195 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 66.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5458 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5458 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5457 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5458 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5458 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,213 +2,213 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 1.0433436632156372,
-            "min": 1.0433436632156372,
-            "max": 2.8903353214263916,
-            "count": 50
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 10007.7529296875,
-            "min": 10007.7529296875,
-            "max": 29582.12109375,
-            "count": 50
         },
         "SnowballTarget.Step.mean": {
-            "value": 499976.0,
-            "min": 9952.0,
-            "max": 499976.0,
-            "count": 50
         },
         "SnowballTarget.Step.sum": {
-            "value": 499976.0,
-            "min": 9952.0,
-            "max": 499976.0,
-            "count": 50
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 11.941898345947266,
-            "min": -0.029164781793951988,
-            "max": 11.941898345947266,
-            "count": 50
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2448.089111328125,
-            "min": -5.657967567443848,
-            "max": 2448.089111328125,
-            "count": 50
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
-            "count": 50
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 10945.0,
             "min": 8756.0,
             "max": 10945.0,
-            "count": 50
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 24.836363636363636,
-            "min": 2.772727272727273,
-            "max": 24.836363636363636,
-            "count": 50
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1366.0,
-            "min": 122.0,
-            "max": 1366.0,
-            "count": 50
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 24.836363636363636,
-            "min": 2.772727272727273,
-            "max": 24.836363636363636,
-            "count": 50
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1366.0,
-            "min": 122.0,
-            "max": 1366.0,
-            "count": 50
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 50
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 50
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.033749266809597125,
-            "min": 0.029031308105451955,
-            "max": 0.04455755887320265,
-            "count": 47
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.033749266809597125,
-            "min": 0.029031308105451955,
-            "max": 0.04455755887320265,
-            "count": 47
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.21887490873535473,
-            "min": 0.09664271038676066,
-            "max": 0.29807205746571225,
-            "count": 47
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.21887490873535473,
-            "min": 0.09664271038676066,
-            "max": 0.29807205746571225,
-            "count": 47
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 5.21769826079999e-06,
-            "min": 5.21769826079999e-06,
-            "max": 0.00029345280218239997,
-            "count": 47
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 5.21769826079999e-06,
-            "min": 5.21769826079999e-06,
-            "max": 0.00029345280218239997,
-            "count": 47
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.1017392,
-            "min": 0.1017392,
-            "max": 0.19781760000000007,
-            "count": 47
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.1017392,
-            "min": 0.1017392,
-            "max": 0.19781760000000007,
-            "count": 47
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 9.678607999999981e-05,
-            "min": 9.678607999999981e-05,
-            "max": 0.004891098240000002,
-            "count": 47
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 9.678607999999981e-05,
-            "min": 9.678607999999981e-05,
-            "max": 0.004891098240000002,
-            "count": 47
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1735995543",
         "python_version": "3.10.12 (main, Nov  6 2024, 20:22:13) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget2 --no-graphics",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.5.1+cu121",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1735996536"
     },
-    "total": 993.28940263,
     "count": 1,
-    "self": 0.4245706540000356,
     "children": {
         "run_training.setup": {
-            "total": 0.056337170000006154,
             "count": 1,
-            "self": 0.056337170000006154
         },
         "TrainerController.start_learning": {
-            "total": 992.808494806,
             "count": 1,
-            "self": 0.9585018079978909,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 1.9245968129999937,
                     "count": 1,
-                    "self": 1.9245968129999937
                 },
                 "TrainerController.advance": {
-                    "total": 989.8385282080022,
-                    "count": 45464,
-                    "self": 0.9712684860089666,
                     "children": {
                         "env_step": {
-                            "total": 774.9790556860028,
-                            "count": 45464,
-                            "self": 590.8048344499957,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 183.58603823599964,
-                                    "count": 45464,
-                                    "self": 3.256037505008635,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 180.330000730991,
-                                            "count": 45464,
-                                            "self": 180.330000730991
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.5881830000073478,
-                                    "count": 45464,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 989.5127421100162,
-                                            "count": 45464,
                                             "is_parallel": true,
-                                            "self": 472.04015061402083,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0027205869999988863,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0008482860000640358,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0018723009999348506,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0018723009999348506
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.035676571000010426,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0007358680000493223,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00040279299997791895,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00040279299997791895
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.03248728099998743,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.03248728099998743
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0020506289999957517,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0003799519999461154,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0016706770000496363,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0016706770000496363
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 517.4725914959954,
-                                                    "count": 45463,
                                                     "is_parallel": true,
-                                                    "self": 25.08902946298963,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 13.955431312991777,
-                                                            "count": 45463,
                                                             "is_parallel": true,
-                                                            "self": 13.955431312991777
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 395.8330503900043,
-                                                            "count": 45463,
                                                             "is_parallel": true,
-                                                            "self": 395.8330503900043
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 82.5950803300097,
-                                                            "count": 45463,
                                                             "is_parallel": true,
-                                                            "self": 14.943817725006454,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 67.65126260500324,
-                                                                    "count": 454630,
                                                                     "is_parallel": true,
-                                                                    "self": 67.65126260500324
                                                                 }
                                                             }
                                                         }
@@ -307,31 +307,31 @@
                             }
                         },
                         "trainer_advance": {
-                            "total": 213.8882040359905,
-                            "count": 45464,
-                            "self": 1.0506595439910598,
                             "children": {
                                 "process_trajectory": {
-                                    "total": 73.19176906499933,
-                                    "count": 45464,
-                                    "self": 72.10983122599907,
                                     "children": {
                                         "RLTrainer._checkpoint": {
-                                            "total": 1.0819378390002612,
-                                            "count": 10,
-                                            "self": 1.0819378390002612
                                         }
                                     }
                                 },
                                 "_update_policy": {
-                                    "total": 139.6457754270001,
-                                    "count": 47,
-                                    "self": 96.88497372299588,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
-                                            "total": 42.76080170400422,
-                                            "count": 2856,
-                                            "self": 42.76080170400422
                                         }
                                     }
                                 }
@@ -340,19 +340,19 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 1.0310000106983352e-06,
                     "count": 1,
-                    "self": 1.0310000106983352e-06
                 },
                 "TrainerController._save_models": {
-                    "total": 0.08686694599987277,
                     "count": 1,
-                    "self": 0.0009152679997441737,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.0859516780001286,
                             "count": 1,
-                            "self": 0.0859516780001286
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.9545086026191711,
+            "min": 0.9391207695007324,
+            "max": 1.0479693412780762,
+            "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 9743.6240234375,
+            "min": 9086.201171875,
+            "max": 10697.6708984375,
+            "count": 20
         },
         "SnowballTarget.Step.mean": {
+            "value": 699960.0,
+            "min": 509992.0,
+            "max": 699960.0,
+            "count": 20
         },
         "SnowballTarget.Step.sum": {
+            "value": 699960.0,
+            "min": 509992.0,
+            "max": 699960.0,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 13.043752670288086,
+            "min": 11.944348335266113,
+            "max": 13.043752670288086,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2543.53173828125,
+            "min": 2305.25927734375,
+            "max": 2657.7587890625,
+            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
+            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
+            "value": 8756.0,
             "min": 8756.0,
             "max": 10945.0,
+            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 26.068181818181817,
+            "min": 24.795454545454547,
+            "max": 26.204545454545453,
+            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1147.0,
+            "min": 1091.0,
+            "max": 1435.0,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 26.068181818181817,
+            "min": 24.795454545454547,
+            "max": 26.204545454545453,
+            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1147.0,
+            "min": 1091.0,
+            "max": 1435.0,
+            "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 20
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.035822989675216375,
+            "min": 0.02571102942974903,
+            "max": 0.042859831821018206,
+            "count": 19
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.035822989675216375,
+            "min": 0.02571102942974903,
+            "max": 0.042859831821018206,
+            "count": 19
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.20447064662973086,
+            "min": 0.1857440204374374,
+            "max": 0.22445170631011327,
+            "count": 19
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.20447064662973086,
+            "min": 0.1857440204374374,
+            "max": 0.22445170631011327,
+            "count": 19
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 5.109569725714209e-07,
+            "min": 5.109569725714209e-07,
+            "max": 8.09932158594286e-05,
+            "count": 19
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 5.109569725714209e-07,
+            "min": 5.109569725714209e-07,
+            "max": 8.09932158594286e-05,
+            "count": 19
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10017028571428567,
+            "min": 0.10017028571428567,
+            "max": 0.1269977142857143,
+            "count": 19
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.10017028571428567,
+            "min": 0.10017028571428567,
+            "max": 0.1269977142857143,
+            "count": 19
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 1.849725714285702e-05,
+            "min": 1.849725714285702e-05,
+            "max": 0.001357185942857142,
+            "count": 19
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 1.849725714285702e-05,
+            "min": 1.849725714285702e-05,
+            "max": 0.001357185942857142,
+            "count": 19
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1735996791",
         "python_version": "3.10.12 (main, Nov  6 2024, 20:22:13) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget2 --no-graphics --resume",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.5.1+cu121",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1735997191"
     },
+    "total": 399.9202619810003,
     "count": 1,
+    "self": 0.4796982510004,
     "children": {
         "run_training.setup": {
+            "total": 0.0578861000001325,
             "count": 1,
+            "self": 0.0578861000001325
         },
         "TrainerController.start_learning": {
+            "total": 399.38267762999976,
             "count": 1,
+            "self": 0.3915310579748166,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 1.9863931160000448,
                     "count": 1,
+                    "self": 1.9863931160000448
                 },
                 "TrainerController.advance": {
+                    "total": 396.91193451302524,
+                    "count": 18192,
+                    "self": 0.4041940640381654,
                     "children": {
                         "env_step": {
+                            "total": 313.65146303799315,
+                            "count": 18192,
+                            "self": 237.38310407998324,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 76.02799335198642,
+                                    "count": 18192,
+                                    "self": 1.3212031129937714,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 74.70679023899265,
+                                            "count": 18192,
+                                            "self": 74.70679023899265
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.240365606023488,
+                                    "count": 18192,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 397.9537662330033,
+                                            "count": 18192,
                                             "is_parallel": true,
+                                            "self": 190.60895667900672,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.002276298999959181,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.000686218000282679,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.001590080999676502,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.001590080999676502
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.03597535900007642,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0007059810000100697,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.0004053479999583942,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0004053479999583942
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.032811723000122583,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.032811723000122583
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.002052306999985376,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0003964780003116175,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0016558289996737585,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0016558289996737585
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 207.34480955399658,
+                                                    "count": 18191,
                                                     "is_parallel": true,
+                                                    "self": 10.10729122898806,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.548815729996477,
+                                                            "count": 18191,
                                                             "is_parallel": true,
+                                                            "self": 5.548815729996477
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 158.47915548401443,
+                                                            "count": 18191,
                                                             "is_parallel": true,
+                                                            "self": 158.47915548401443
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 33.20954711099762,
+                                                            "count": 18191,
                                                             "is_parallel": true,
+                                                            "self": 6.0152952949040355,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 27.194251816093583,
+                                                                    "count": 181910,
                                                                     "is_parallel": true,
+                                                                    "self": 27.194251816093583
                                                                 }
                                                             }
                                                         }
                             }
                         },
                         "trainer_advance": {
+                            "total": 82.85627741099393,
+                            "count": 18192,
+                            "self": 0.43775320799977635,
                             "children": {
                                 "process_trajectory": {
+                                    "total": 26.99354049599424,
+                                    "count": 18192,
+                                    "self": 26.54805537999414,
                                     "children": {
                                         "RLTrainer._checkpoint": {
+                                            "total": 0.4454851160000999,
+                                            "count": 4,
+                                            "self": 0.4454851160000999
                                         }
                                     }
                                 },
                                 "_update_policy": {
+                                    "total": 55.42498370699991,
+                                    "count": 19,
+                                    "self": 37.852424140002086,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
+                                            "total": 17.572559566997825,
+                                            "count": 1155,
+                                            "self": 17.572559566997825
                                         }
                                     }
                                 }
                     }
                 },
                 "trainer_threads": {
+                    "total": 8.659999366500415e-07,
                     "count": 1,
+                    "self": 8.659999366500415e-07
                 },
                 "TrainerController._save_models": {
+                    "total": 0.09281807699971978,
                     "count": 1,
+                    "self": 0.0011537249997672916,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.09166435199995249,
                             "count": 1,
+                            "self": 0.09166435199995249
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -1,51 +1,6 @@
 {
     "SnowballTarget": {
         "checkpoints": [
-            {
-                "steps": 99960,
-                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 11.818181818181818,
-                "creation_time": 1735995742.583181,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-99960.pt"
-                ]
-            },
-            {
-                "steps": 149984,
-                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 14.045454545454545,
-                "creation_time": 1735995840.8040826,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-149984.pt"
-                ]
-            },
-            {
-                "steps": 199984,
-                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": null,
-                "creation_time": 1735995940.2837977,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-199984.pt"
-                ]
-            },
-            {
-                "steps": 249944,
-                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-249944.onnx",
-                "reward": 19.15909090909091,
-                "creation_time": 1735996037.2722485,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-249944.pt"
-                ]
-            },
-            {
-                "steps": 299968,
-                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-299968.onnx",
-                "reward": 20.636363636363637,
-                "creation_time": 1735996138.734955,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-299968.pt"
-                ]
-            },
             {
                 "steps": 349992,
                 "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-349992.onnx",
@@ -90,15 +45,60 @@
                 "auxillary_file_paths": [
                     "results/SnowballTarget2/SnowballTarget/SnowballTarget-500104.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 500104,
             "file_path": "results/SnowballTarget2/SnowballTarget.onnx",
-            "reward": 24.681818181818183,
-            "creation_time": 1735996536.097647,
             "auxillary_file_paths": [
-                "results/SnowballTarget2/SnowballTarget/SnowballTarget-500104.pt"
             ]
         }
     },

 {
     "SnowballTarget": {
         "checkpoints": [
             {
                 "steps": 349992,
                 "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-349992.onnx",
                 "auxillary_file_paths": [
                     "results/SnowballTarget2/SnowballTarget/SnowballTarget-500104.pt"
                 ]
+            },
+            {
+                "steps": 549976,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-549976.onnx",
+                "reward": 24.757575757575758,
+                "creation_time": 1735996891.9949698,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-549976.pt"
+                ]
+            },
+            {
+                "steps": 599936,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-599936.onnx",
+                "reward": 26.181818181818183,
+                "creation_time": 1735996992.509469,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-599936.pt"
+                ]
+            },
+            {
+                "steps": 649960,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-649960.onnx",
+                "reward": 25.636363636363637,
+                "creation_time": 1735997092.3204386,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-649960.pt"
+                ]
+            },
+            {
+                "steps": 699960,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-699960.onnx",
+                "reward": null,
+                "creation_time": 1735997190.804446,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-699960.pt"
+                ]
+            },
+            {
+                "steps": 700216,
+                "file_path": "results/SnowballTarget2/SnowballTarget/SnowballTarget-700216.onnx",
+                "reward": null,
+                "creation_time": 1735997190.9208763,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget2/SnowballTarget/SnowballTarget-700216.pt"
+                ]
             }
         ],
         "final_checkpoint": {
+            "steps": 700216,
             "file_path": "results/SnowballTarget2/SnowballTarget.onnx",
+            "reward": null,
+            "creation_time": 1735997190.9208763,
             "auxillary_file_paths": [
+                "results/SnowballTarget2/SnowballTarget/SnowballTarget-700216.pt"
             ]
         }
     },