Weiming1122 committed on Dec 28, 2023

Commit

c21121d

1 Parent(s): 73daf80

First Push

Browse files

Files changed (18) hide show

SnowballTarget.onnx +2 -2
SnowballTarget/SnowballTarget-1499800.onnx +3 -0
SnowballTarget/SnowballTarget-1499800.pt +3 -0
SnowballTarget/SnowballTarget-1999800.onnx +3 -0
SnowballTarget/SnowballTarget-1999800.pt +3 -0
SnowballTarget/SnowballTarget-2002000.onnx +3 -0
SnowballTarget/SnowballTarget-2002000.pt +3 -0
SnowballTarget/SnowballTarget-499800.onnx +3 -0
SnowballTarget/SnowballTarget-499800.pt +3 -0
SnowballTarget/SnowballTarget-999800.onnx +3 -0
SnowballTarget/SnowballTarget-999800.pt +3 -0
SnowballTarget/checkpoint.pt +2 -2
SnowballTarget/events.out.tfevents.1703744705.013cfbc1c1fd.1595.0 +3 -0
config.json +1 -1
configuration.yaml +6 -6
run_logs/Player-0.log +16 -16
run_logs/timers.json +176 -176
run_logs/training_status.json +29 -29

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cd2dba79d43f01bb26643190830efee007fb702a0e5577e9abccd72a5025af0d
-size 650646

 version https://git-lfs.github.com/spec/v1
+oid sha256:950255ca55f381fa34c7b6f6969d854c8dfd3c67d1057a244172aa3a483c5d2f
+size 914755

SnowballTarget/SnowballTarget-1499800.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab0ab123f2ee6001d41490673f6a059abe6d557053e48b5c3be79a292aeecfc5
+size 914755

SnowballTarget/SnowballTarget-1499800.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad5df9418b592424eaef8b3e28c7895651312bc452bab7019c08e017c0d4c0cc
+size 5434534

SnowballTarget/SnowballTarget-1999800.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:950255ca55f381fa34c7b6f6969d854c8dfd3c67d1057a244172aa3a483c5d2f
+size 914755

SnowballTarget/SnowballTarget-1999800.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:062b9c9e85b5273a11e675b3b612c69b86167dc424f214a8354861383a904d02
+size 5434534

SnowballTarget/SnowballTarget-2002000.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:950255ca55f381fa34c7b6f6969d854c8dfd3c67d1057a244172aa3a483c5d2f
+size 914755

SnowballTarget/SnowballTarget-2002000.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc88f8fdd31501ff96b22ad439684b715929ff2a65d8c1a70f64e35115111875
+size 5434534

SnowballTarget/SnowballTarget-499800.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cdc33a117505eb9c78c9663f15872548706b4dbb4c1581d363bf2208cba6b0d1
+size 914755

SnowballTarget/SnowballTarget-499800.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:733380eec82c2792c52ce3b1dcb462a8b6260a03d6061be4e59fe85a689daf81
+size 5434379

SnowballTarget/SnowballTarget-999800.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0046cea82e73e5ef68f8448dd945ee494ee9e01c95fc70957331ed488438e87b
+size 914755

SnowballTarget/SnowballTarget-999800.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a389de0c39d65553f78d55cdfb298348f56de65aeb92bb19a76c76f398af6671
+size 5434379

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b3f6c82ea38e791c21420195edddd70a81dfe6177856617535df342b3447ee84
-size 3849250

 version https://git-lfs.github.com/spec/v1
+oid sha256:48b1acd7388f806368b8f40d6186b6b1bcb1b57acb6982cb5d6a206bda9ee726
+size 5433378

SnowballTarget/events.out.tfevents.1703744705.013cfbc1c1fd.1595.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:53e47c54ffe29c9d5ade86d4bad145cd26bf05b321dff0bc82189ef91f9ccbc7
+size 39769

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 10240, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 2000000, "time_horizon": 256, "summary_freq": 50000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -4,7 +4,7 @@ behaviors:
     trainer_type: ppo
     hyperparameters:
       batch_size: 128
-      buffer_size: 2048
       learning_rate: 0.0003
       beta: 0.005
       epsilon: 0.2
@@ -14,11 +14,11 @@ behaviors:
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
-    checkpoint_interval: 50000
     network_settings:
       normalize: false
       hidden_units: 256
-      num_layers: 2
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
@@ -38,9 +38,9 @@ behaviors:
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
-    max_steps: 200000
-    time_horizon: 64
-    summary_freq: 10000
     threaded: true
     self_play: null
     behavioral_cloning: null

     trainer_type: ppo
     hyperparameters:
       batch_size: 128
+      buffer_size: 10240
       learning_rate: 0.0003
       beta: 0.005
       epsilon: 0.2
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
+    checkpoint_interval: 500000
     network_settings:
       normalize: false
       hidden_units: 256
+      num_layers: 3
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
+    max_steps: 2000000
+    time_horizon: 256
+    summary_freq: 50000
     threaded: true
     self_play: null
     behavioral_cloning: null

run_logs/Player-0.log CHANGED Viewed

@@ -34,7 +34,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.091 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +45,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.887692 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +53,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5368 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,22 +169,22 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 40
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
-      Peak Block count 1
-      Peak Allocated memory 6.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.8 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -213,13 +213,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 4535 frames, [64.0 KB-128.0 KB]: 925 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 67.7 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +231,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5460 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5459 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +249,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5460 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5460 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.094 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.784973 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 53690 frames, [16.0 KB-32.0 KB]: 910 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 45
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 12791 frames, [8.0 MB-16.0 MB]: 26996 frames, [16.0 MB-32.0 MB]: 14814 frames
       Requested Block Size 16.0 MB
+      Peak Block count 2
+      Peak Allocated memory 24.3 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 54601 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.7 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 52658 frames, [64.0 KB-128.0 KB]: 1943 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 66.4 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 54601 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 54601 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 54600 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 54601 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 54601 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,153 +2,153 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.8669962286949158,
-            "min": 0.8669962286949158,
-            "max": 2.869570255279541,
-            "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 8287.6171875,
-            "min": 8287.6171875,
-            "max": 29387.26953125,
-            "count": 20
         },
         "SnowballTarget.Step.mean": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
         },
         "SnowballTarget.Step.sum": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 12.66847038269043,
-            "min": 0.45318853855133057,
-            "max": 12.66847038269043,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2470.351806640625,
-            "min": 87.9185791015625,
-            "max": 2574.646484375,
-            "count": 20
         },
-        "SnowballTarget.Environment.EpisodeLength.mean": {
-            "value": 199.0,
-            "min": 199.0,
-            "max": 199.0,
-            "count": 20
         },
-        "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 8756.0,
-            "min": 8756.0,
-            "max": 10945.0,
-            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.06753355493299965,
-            "min": 0.06494867389750046,
-            "max": 0.07367765676691289,
-            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.2701342197319986,
-            "min": 0.26150085703428727,
-            "max": 0.3518778981381853,
-            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.18394062193293198,
-            "min": 0.11935577595688622,
-            "max": 0.3019716292619705,
-            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.7357624877317279,
-            "min": 0.4774231038275449,
-            "max": 1.349198090095146,
-            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 8.082097306000005e-06,
-            "min": 8.082097306000005e-06,
-            "max": 0.000291882002706,
-            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 3.232838922400002e-05,
-            "min": 3.232838922400002e-05,
-            "max": 0.00138516003828,
-            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.10269400000000001,
-            "min": 0.10269400000000001,
-            "max": 0.19729400000000002,
-            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.41077600000000003,
-            "min": 0.41077600000000003,
-            "max": 0.96172,
-            "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0001444306000000001,
-            "min": 0.0001444306000000001,
-            "max": 0.0048649706,
-            "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.0005777224000000004,
-            "min": 0.0005777224000000004,
-            "max": 0.023089828,
-            "count": 20
-        },
-        "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 24.977272727272727,
-            "min": 3.340909090909091,
-            "max": 24.977272727272727,
-            "count": 20
-        },
-        "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1099.0,
-            "min": 147.0,
-            "max": 1343.0,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 24.977272727272727,
-            "min": 3.340909090909091,
-            "max": 24.977272727272727,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1099.0,
-            "min": 147.0,
-            "max": 1343.0,
-            "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 20
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 20
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1703733181",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
         "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.1.0.dev0",
@@ -156,59 +156,59 @@
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.1.2+cu121",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1703733626"
     },
-    "total": 444.9509761369999,
     "count": 1,
-    "self": 0.4379683639998575,
     "children": {
         "run_training.setup": {
-            "total": 0.053479809999998906,
             "count": 1,
-            "self": 0.053479809999998906
         },
         "TrainerController.start_learning": {
-            "total": 444.459527963,
             "count": 1,
-            "self": 0.5459963899983222,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 3.2033515960000614,
                     "count": 1,
-                    "self": 3.2033515960000614
                 },
                 "TrainerController.advance": {
-                    "total": 440.62231021600155,
-                    "count": 18200,
-                    "self": 0.2626727869825345,
                     "children": {
                         "env_step": {
-                            "total": 440.359637429019,
-                            "count": 18200,
-                            "self": 288.21511279604624,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 151.86545625198835,
-                                    "count": 18200,
-                                    "self": 1.4392349629639511,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 150.4262212890244,
-                                            "count": 18200,
-                                            "self": 150.4262212890244
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.27906838098442677,
-                                    "count": 18200,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 443.3267502729932,
-                                            "count": 18200,
                                             "is_parallel": true,
-                                            "self": 219.03763023398915,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0050096449999728065,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0034699119997867456,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.001539733000186061,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.001539733000186061
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.051181425999971,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0007588099998656617,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00041097300004366843,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00041097300004366843
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.04814685999997437,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.04814685999997437
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0018647830000873,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0003552319999471365,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0015095510001401635,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0015095510001401635
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 224.28912003900405,
-                                                    "count": 18199,
                                                     "is_parallel": true,
-                                                    "self": 10.658013661026985,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 5.23273210699881,
-                                                            "count": 18199,
                                                             "is_parallel": true,
-                                                            "self": 5.23273210699881
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 174.956716884961,
-                                                            "count": 18199,
                                                             "is_parallel": true,
-                                                            "self": 174.956716884961
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 33.441657386017255,
-                                                            "count": 18199,
                                                             "is_parallel": true,
-                                                            "self": 6.176670708015649,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 27.264986678001605,
-                                                                    "count": 181990,
                                                                     "is_parallel": true,
-                                                                    "self": 27.264986678001605
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 0.00011886200013577763,
                     "count": 1,
-                    "self": 0.00011886200013577763,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,36 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 435.2241449229941,
-                                    "count": 677405,
                                     "is_parallel": true,
-                                    "self": 13.744515058067122,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 239.4991322549257,
-                                            "count": 677405,
                                             "is_parallel": true,
-                                            "self": 238.5485157069255,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 0.9506165480001982,
                                                     "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 0.9506165480001982
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 181.9804976100013,
-                                            "count": 90,
                                             "is_parallel": true,
-                                            "self": 57.51711164299843,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 124.46338596700286,
-                                                    "count": 4587,
                                                     "is_parallel": true,
-                                                    "self": 124.46338596700286
                                                 }
                                             }
                                         }
@@ -360,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.08775089899995692,
                     "count": 1,
-                    "self": 0.0009682820000307402,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.08678261699992618,
                             "count": 1,
-                            "self": 0.08678261699992618
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.839410126209259,
+            "min": 0.839410126209259,
+            "max": 2.844252109527588,
+            "count": 40
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 42363.3515625,
+            "min": 40732.9296875,
+            "max": 144451.03125,
+            "count": 40
+        },
+        "SnowballTarget.Environment.EpisodeLength.mean": {
+            "value": 199.0,
+            "min": 199.0,
+            "max": 199.0,
+            "count": 40
+        },
+        "SnowballTarget.Environment.EpisodeLength.sum": {
+            "value": 50347.0,
+            "min": 48158.0,
+            "max": 52536.0,
+            "count": 40
         },
         "SnowballTarget.Step.mean": {
+            "value": 1999800.0,
+            "min": 49800.0,
+            "max": 1999800.0,
+            "count": 40
         },
         "SnowballTarget.Step.sum": {
+            "value": 1999800.0,
+            "min": 49800.0,
+            "max": 1999800.0,
+            "count": 40
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 14.501752853393555,
+            "min": 0.5022461414337158,
+            "max": 14.501752853393555,
+            "count": 40
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 3625.438232421875,
+            "min": 125.05929565429688,
+            "max": 3625.438232421875,
+            "count": 40
         },
+        "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 28.388,
+            "min": 5.008032128514056,
+            "max": 28.448,
+            "count": 40
         },
+        "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 7097.0,
+            "min": 1247.0,
+            "max": 7112.0,
+            "count": 40
+        },
+        "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 28.388,
+            "min": 5.008032128514056,
+            "max": 28.448,
+            "count": 40
+        },
+        "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 7097.0,
+            "min": 1247.0,
+            "max": 7112.0,
+            "count": 40
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.069219311003226,
+            "min": 0.0659932713580287,
+            "max": 0.0739939942222383,
+            "count": 40
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.276877244012904,
+            "min": 0.2639730854321148,
+            "max": 0.3581072422068817,
+            "count": 40
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.15687800026407428,
+            "min": 0.14771346322836815,
+            "max": 0.2919780290740378,
+            "count": 40
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.6275120010562971,
+            "min": 0.6275120010562971,
+            "max": 1.3910198542445091,
+            "count": 40
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 3.825098724999995e-06,
+            "min": 3.825098724999995e-06,
+            "max": 0.00029587500137499996,
+            "count": 40
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 1.530039489999998e-05,
+            "min": 1.530039489999998e-05,
+            "max": 0.0014422500192499998,
+            "count": 40
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10127499999999999,
+            "min": 0.10127499999999999,
+            "max": 0.19862500000000005,
+            "count": 40
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.40509999999999996,
+            "min": 0.40509999999999996,
+            "max": 0.9807500000000001,
+            "count": 40
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 7.362249999999992e-05,
+            "min": 7.362249999999992e-05,
+            "max": 0.0049313875,
+            "count": 40
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.0002944899999999997,
+            "min": 0.0002944899999999997,
+            "max": 0.024039425,
+            "count": 40
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 40
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 40
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1703744704",
         "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
         "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.1.2+cu121",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1703749228"
     },
+    "total": 4524.0049186979995,
     "count": 1,
+    "self": 0.6768422829991323,
     "children": {
         "run_training.setup": {
+            "total": 0.06769795000002432,
             "count": 1,
+            "self": 0.06769795000002432
         },
         "TrainerController.start_learning": {
+            "total": 4523.260378465,
             "count": 1,
+            "self": 6.153770934033673,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.387389077000023,
                     "count": 1,
+                    "self": 3.387389077000023
                 },
                 "TrainerController.advance": {
+                    "total": 4513.5815245649665,
+                    "count": 182002,
+                    "self": 2.794995134952842,
                     "children": {
                         "env_step": {
+                            "total": 4510.786529430014,
+                            "count": 182002,
+                            "self": 2907.504590901017,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 1600.249445852959,
+                                    "count": 182002,
+                                    "self": 15.010505520020615,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 1585.2389403329385,
+                                            "count": 182002,
+                                            "self": 1585.2389403329385
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 3.032492676037407,
+                                    "count": 182002,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 4511.344607695967,
+                                            "count": 182002,
                                             "is_parallel": true,
+                                            "self": 2199.071089124015,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.004833086000019193,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.003405404999966777,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0014276810000524165,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0014276810000524165
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.0377329269999791,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0007396139999968909,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.00040095899998959794,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00040095899998959794
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.034467437999978756,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.034467437999978756
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0021249160000138545,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00041478200006395127,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0017101339999499032,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0017101339999499032
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 2312.273518571952,
+                                                    "count": 182001,
                                                     "is_parallel": true,
+                                                    "self": 110.96179828893128,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 53.66522611495839,
+                                                            "count": 182001,
                                                             "is_parallel": true,
+                                                            "self": 53.66522611495839
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 1805.0553392249547,
+                                                            "count": 182001,
                                                             "is_parallel": true,
+                                                            "self": 1805.0553392249547
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 342.5911549431076,
+                                                            "count": 182001,
                                                             "is_parallel": true,
+                                                            "self": 63.7990347122423,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 278.7921202308653,
+                                                                    "count": 1820010,
                                                                     "is_parallel": true,
+                                                                    "self": 278.7921202308653
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 0.001607125000191445,
                     "count": 1,
+                    "self": 0.001607125000191445,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 4457.231079032006,
+                                    "count": 6689180,
                                     "is_parallel": true,
+                                    "self": 142.82890651324124,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 2243.318894835765,
+                                            "count": 6689180,
                                             "is_parallel": true,
+                                            "self": 2242.5206855647652,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 0.7982092709999051,
                                                     "count": 4,
                                                     "is_parallel": true,
+                                                    "self": 0.7982092709999051
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 2071.0832776830002,
+                                            "count": 181,
                                             "is_parallel": true,
+                                            "self": 620.9278815499742,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 1450.155396133026,
+                                                    "count": 46161,
                                                     "is_parallel": true,
+                                                    "self": 1450.155396133026
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.1360867639996286,
                     "count": 1,
+                    "self": 0.0017097370000556111,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.134377026999573,
                             "count": 1,
+                            "self": 0.134377026999573
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -2,58 +2,58 @@
     "SnowballTarget": {
         "checkpoints": [
             {
-                "steps": 49936,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 12.636363636363637,
-                "creation_time": 1703733295.7324486,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             },
             {
-                "steps": 99960,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 21.363636363636363,
-                "creation_time": 1703733407.587789,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             },
             {
-                "steps": 149984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 23.181818181818183,
-                "creation_time": 1703733517.5242794,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
-                "steps": 199984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 24.363636363636363,
-                "creation_time": 1703733625.6377993,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
-                "steps": 200112,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
-                "reward": 24.363636363636363,
-                "creation_time": 1703733625.7565851,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 24.363636363636363,
-            "creation_time": 1703733625.7565851,
             "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },

     "SnowballTarget": {
         "checkpoints": [
             {
+                "steps": 499800,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-499800.onnx",
+                "reward": 26.625,
+                "creation_time": 1703745843.0743196,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-499800.pt"
                 ]
             },
             {
+                "steps": 999800,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-999800.onnx",
+                "reward": 27.632653061224488,
+                "creation_time": 1703746971.4188666,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-999800.pt"
                 ]
             },
             {
+                "steps": 1499800,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-1499800.onnx",
+                "reward": 28.31578947368421,
+                "creation_time": 1703748101.412122,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-1499800.pt"
                 ]
             },
             {
+                "steps": 1999800,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-1999800.onnx",
+                "reward": 28.75,
+                "creation_time": 1703749227.0901036,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-1999800.pt"
                 ]
             },
             {
+                "steps": 2002000,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-2002000.onnx",
+                "reward": 28.927272727272726,
+                "creation_time": 1703749227.4071867,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-2002000.pt"
                 ]
             }
         ],
         "final_checkpoint": {
+            "steps": 2002000,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 28.927272727272726,
+            "creation_time": 1703749227.4071867,
             "auxillary_file_paths": [
+                "results/SnowballTarget1/SnowballTarget/SnowballTarget-2002000.pt"
             ]
         }
     },