hartman23 committed on Dec 20, 2024

Commit

1ec3516

verified ·

1 Parent(s): a014b2f

Add first optimized SnowbalThrower

Browse files

Files changed (18) hide show

SnowballTarget.onnx +2 -2
SnowballTarget/SnowballTarget-149984.onnx +2 -2
SnowballTarget/SnowballTarget-149984.pt +2 -2
SnowballTarget/SnowballTarget-199984.onnx +2 -2
SnowballTarget/SnowballTarget-199984.pt +2 -2
SnowballTarget/SnowballTarget-200184.onnx +2 -2
SnowballTarget/SnowballTarget-200184.pt +2 -2
SnowballTarget/SnowballTarget-49936.onnx +2 -2
SnowballTarget/SnowballTarget-49936.pt +2 -2
SnowballTarget/SnowballTarget-99960.onnx +2 -2
SnowballTarget/SnowballTarget-99960.pt +2 -2
SnowballTarget/checkpoint.pt +2 -2
SnowballTarget/events.out.tfevents.1734712357.e5f9a005203d.18978.0 +3 -0
config.json +1 -1
configuration.yaml +11 -11
run_logs/Player-0.log +15 -15
run_logs/timers.json +131 -131
run_logs/training_status.json +21 -21

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b81e5a96df91d78c21dcb723c7251ce2f2871f7ffc3f783878871bc524523c7
-size 485667

 version https://git-lfs.github.com/spec/v1
+oid sha256:da0f3b9a9bc306c307a978cfd73e9c2084ca146bef25aafa1f4d82d40214308d
+size 941878

SnowballTarget/SnowballTarget-149984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5fb9cbf686798d422f938a4f0b62c9d4806928721ff2c0209883d62e98d5211f
-size 485667

 version https://git-lfs.github.com/spec/v1
+oid sha256:6f647896f05b419ed790eae5f2da6f8ae3ac56218c24a40ad80005f888ac0f63
+size 941878

SnowballTarget/SnowballTarget-149984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5e3d6fbdd67caf05b08b9fab003ef13f159021b6a519112727a8cc16eda532e0
-size 2864907

 version https://git-lfs.github.com/spec/v1
+oid sha256:6175eba23ea975648028fe35e02ea47d204d458f3301d2bcf314e4fac7595431
+size 5589211

SnowballTarget/SnowballTarget-199984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b81e5a96df91d78c21dcb723c7251ce2f2871f7ffc3f783878871bc524523c7
-size 485667

 version https://git-lfs.github.com/spec/v1
+oid sha256:da0f3b9a9bc306c307a978cfd73e9c2084ca146bef25aafa1f4d82d40214308d
+size 941878

SnowballTarget/SnowballTarget-199984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9eb982a4bd7a43e2aac177971aed0e71eb41ed72b6a6c076dd8e937941baa7a0
-size 2864907

 version https://git-lfs.github.com/spec/v1
+oid sha256:2820445ee639abc23e56b3c4d4d941c40e1a8710f8af7024bb645679d6f48642
+size 5589211

SnowballTarget/SnowballTarget-200184.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4b81e5a96df91d78c21dcb723c7251ce2f2871f7ffc3f783878871bc524523c7
-size 485667

 version https://git-lfs.github.com/spec/v1
+oid sha256:da0f3b9a9bc306c307a978cfd73e9c2084ca146bef25aafa1f4d82d40214308d
+size 941878

SnowballTarget/SnowballTarget-200184.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e2ebdd82b5201968002d9c22ff1b360cea64ead8c34240ddb273d7824f3712d5
-size 2864907

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee42bd14f998083bd5d0d527642b1f7de329388db82eac42c29d00e682b025b2
+size 5589211

SnowballTarget/SnowballTarget-49936.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c2e0cb13d4886516279a9d5357cb710a8f35290543600d5096ccefb98b1ed85c
-size 485667

 version https://git-lfs.github.com/spec/v1
+oid sha256:f2d339482a6216fcf42bf72f731dd4e877d1d5f2ceb1af77fa75c6f587890e67
+size 941878

SnowballTarget/SnowballTarget-49936.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:267aa29e03f202a520aa6519639bf0b81edf1e69ea1a0cf924e5aa4721f81afc
-size 2864816

 version https://git-lfs.github.com/spec/v1
+oid sha256:d97ba229b2fb42e9b779f495890e863ce1acf332f10653f30c3e554f2c40e7bd
+size 5589136

SnowballTarget/SnowballTarget-99960.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:070ae9dfdd9a37d0ca6643f1b193e05e5be93d2b8e50e0a2d4010ac900e43268
-size 485667

 version https://git-lfs.github.com/spec/v1
+oid sha256:f2a6a8626f6a21da48ee65652b9595649c80bdfc5f51609589342986d8c72a75
+size 941878

SnowballTarget/SnowballTarget-99960.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ef0c20427fab80137874adc9a3297a1373c35e565ad17011b9e2c2597341139
-size 2864816

 version https://git-lfs.github.com/spec/v1
+oid sha256:9012dd0af101791e7c6d7182ef5e8bd118a5853791c86f1e2a3dd83213242c3d
+size 5589136

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7fece49937c7e0c00f62c1148ee66ac3ed4cc03387fc5e5c9ddc7c98a09fed37
-size 2863906

 version https://git-lfs.github.com/spec/v1
+oid sha256:99088051f9ae6668e52fa3b18e71c1707a07952b9bc4164d4bba0970471066fd
+size 5588386

SnowballTarget/events.out.tfevents.1734712357.e5f9a005203d.18978.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4bc9e810da77196cf7858f1b35bc25935bf4cea377e5ad03bc16d6e95c1b3636
+size 30177

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 129, "buffer_size": 1172, "learning_rate": 0.005848717855174421, "beta": 0.0006933626020387194, "epsilon": 0.0015104254518785796, "lambd": 0.9809480780691303, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 168, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9417107177844183, "strength": 0.9576267730399072, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget11", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 255, "buffer_size": 1051, "learning_rate": 0.0033585016653676788, "beta": 0.04458576263259719, "epsilon": 0.06481103071316076, "lambd": 0.9200382214218608, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 332, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.9344680687013123, "strength": 0.7743161246844508, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget14", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -3,12 +3,12 @@ behaviors:
   SnowballTarget:
     trainer_type: ppo
     hyperparameters:
-      batch_size: 129
-      buffer_size: 1172
-      learning_rate: 0.005848717855174421
-      beta: 0.0006933626020387194
-      epsilon: 0.0015104254518785796
-      lambd: 0.9809480780691303
       num_epoch: 3
       shared_critic: false
       learning_rate_schedule: linear
@@ -17,16 +17,16 @@ behaviors:
     checkpoint_interval: 50000
     network_settings:
       normalize: false
-      hidden_units: 168
-      num_layers: 3
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
       deterministic: false
     reward_signals:
       extrinsic:
-        gamma: 0.9417107177844183
-        strength: 0.9576267730399072
         network_settings:
           normalize: false
           hidden_units: 128
@@ -66,7 +66,7 @@ engine_settings:
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
-  run_id: SnowballTarget11
   initialize_from: null
   load_model: false
   resume: false

   SnowballTarget:
     trainer_type: ppo
     hyperparameters:
+      batch_size: 255
+      buffer_size: 1051
+      learning_rate: 0.0033585016653676788
+      beta: 0.04458576263259719
+      epsilon: 0.06481103071316076
+      lambd: 0.9200382214218608
       num_epoch: 3
       shared_critic: false
       learning_rate_schedule: linear
     checkpoint_interval: 50000
     network_settings:
       normalize: false
+      hidden_units: 332
+      num_layers: 2
       vis_encode_type: simple
       memory: null
       goal_conditioning_type: hyper
       deterministic: false
     reward_signals:
       extrinsic:
+        gamma: 0.9344680687013123
+        strength: 0.7743161246844508
         network_settings:
           normalize: false
           hidden_units: 128
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
+  run_id: SnowballTarget14
   initialize_from: null
   load_model: false
   resume: false

run_logs/Player-0.log CHANGED Viewed

@@ -31,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.153 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -42,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.754228 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -50,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5371 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -166,22 +166,22 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 37
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 6.7 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.8 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -210,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5058 frames, [64.0 KB-128.0 KB]: 405 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 66.4 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -228,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5463 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5462 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -246,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5463 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5463 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.107 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.934545 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5373 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 43
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5465 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 6.9 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5465 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.6 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 4848 frames, [64.0 KB-128.0 KB]: 617 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 67.3 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5465 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5465 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5464 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5465 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5465 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,15 +2,15 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 1.6439284086227417,
-            "min": 1.6439284086227417,
-            "max": 2.8902804851531982,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 15840.89453125,
-            "min": 15840.89453125,
-            "max": 29758.328125,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
@@ -26,15 +26,15 @@
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 1.9428905248641968,
-            "min": 0.1823497712612152,
-            "max": 1.9428905248641968,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 378.8636474609375,
-            "min": 35.3758544921875,
-            "max": 380.93072509765625,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
@@ -50,87 +50,87 @@
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.06267216122382648,
-            "min": 0.055472424205818945,
-            "max": 0.07582000890679685,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.43870512856678534,
-            "min": 0.3883069694407326,
-            "max": 0.5136208887223149,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.136476278666294,
-            "min": 0.058655292562828594,
-            "max": 0.16762607907513521,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.9553339506640579,
-            "min": 0.41058704793980016,
-            "max": 1.1733825535259466,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 0.00014598409516915355,
-            "min": 0.00014598409516915355,
-            "max": 0.005700316389999796,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 0.0010218886661840748,
-            "min": 0.0010218886661840748,
-            "max": 0.037950692572355366,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.09754170021927888,
-            "min": 0.004009434256746251,
-            "max": 0.09754170021927888,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.6827919015349522,
-            "min": 0.024056605540477505,
-            "max": 0.6827919015349522,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 2.7056730546886436e-05,
-            "min": 2.7056730546886436e-05,
-            "max": 0.0006760234149496571,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.00018939711382820506,
-            "min": 0.00018939711382820506,
-            "max": 0.00450414858310068,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 23.386363636363637,
-            "min": 2.6545454545454548,
-            "max": 23.386363636363637,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1029.0,
-            "min": 124.0,
-            "max": 1227.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 22.395407249981705,
-            "min": 2.54206375208768,
-            "max": 22.395407249981705,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 985.3979189991951,
-            "min": 118.74571794271469,
-            "max": 1175.0080181956291,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
@@ -148,67 +148,67 @@
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1734645837",
         "python_version": "3.10.12 (main, Nov  6 2024, 20:22:13) [GCC 11.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget11 --no-graphics --force",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.5.1+cu121",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1734646329"
     },
-    "total": 492.4546862169991,
     "count": 1,
-    "self": 0.5267043589992682,
     "children": {
         "run_training.setup": {
-            "total": 0.10980674199890927,
             "count": 1,
-            "self": 0.10980674199890927
         },
         "TrainerController.start_learning": {
-            "total": 491.81817511600093,
             "count": 1,
-            "self": 0.8021783462972962,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 2.2097316759973182,
                     "count": 1,
-                    "self": 2.2097316759973182
                 },
                 "TrainerController.advance": {
-                    "total": 488.7256403117026,
-                    "count": 18209,
-                    "self": 0.372184840925911,
                     "children": {
                         "env_step": {
-                            "total": 488.3534554707767,
-                            "count": 18209,
-                            "self": 361.6315583955293,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 126.34392291447875,
-                                    "count": 18209,
-                                    "self": 2.022507725367177,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 124.32141518911158,
-                                            "count": 18209,
-                                            "self": 124.32141518911158
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.37797416076864465,
-                                    "count": 18209,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 490.0476761838072,
-                                            "count": 18209,
                                             "is_parallel": true,
-                                            "self": 216.11597017761596,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0025727829997777008,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0007713410050200764,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0018014419947576243,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0018014419947576243
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.04092625699922792,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0008045159993343987,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.000446805999672506,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.000446805999672506
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.037390420999145135,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.037390420999145135
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.002284514001075877,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0004699480050476268,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.00181456599602825,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.00181456599602825
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 273.93170600619123,
-                                                    "count": 18208,
                                                     "is_parallel": true,
-                                                    "self": 12.34132495736776,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 6.28572836901003,
-                                                            "count": 18208,
                                                             "is_parallel": true,
-                                                            "self": 6.28572836901003
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 215.35456801667533,
-                                                            "count": 18208,
                                                             "is_parallel": true,
-                                                            "self": 215.35456801667533
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 39.950084663138114,
-                                                            "count": 18208,
                                                             "is_parallel": true,
-                                                            "self": 7.68151135008884,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 32.268573313049274,
-                                                                    "count": 182080,
                                                                     "is_parallel": true,
-                                                                    "self": 32.268573313049274
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 0.0003680500012706034,
                     "count": 1,
-                    "self": 0.0003680500012706034,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,36 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 485.92623232954793,
-                                    "count": 372338,
                                     "is_parallel": true,
-                                    "self": 8.142840825508756,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 182.39031493504444,
-                                            "count": 372338,
                                             "is_parallel": true,
-                                            "self": 181.79515693904614,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 0.5951579959983064,
                                                     "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 0.5951579959983064
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 295.39307656899473,
-                                            "count": 136,
                                             "is_parallel": true,
-                                            "self": 83.54235101915401,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 211.85072554984072,
-                                                    "count": 4353,
                                                     "is_parallel": true,
-                                                    "self": 211.85072554984072
                                                 }
                                             }
                                         }
@@ -360,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.08025673200245365,
                     "count": 1,
-                    "self": 0.0012775960021826904,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.07897913600027096,
                             "count": 1,
-                            "self": 0.07897913600027096
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 1.602304458618164,
+            "min": 1.602304458618164,
+            "max": 2.8853836059570312,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 15475.056640625,
+            "min": 15475.056640625,
+            "max": 29549.212890625,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 1.462786078453064,
+            "min": 0.20903053879737854,
+            "max": 1.462786078453064,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 285.2432861328125,
+            "min": 40.55192565917969,
+            "max": 295.2460021972656,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.04278062743071046,
+            "min": 0.03740328233245583,
+            "max": 0.05381372995640656,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.2994643920149732,
+            "min": 0.25109103050393367,
+            "max": 0.3492709052506447,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.064781530272393,
+            "min": 0.0370886461454488,
+            "max": 0.09625423115988573,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.45347071190675103,
+            "min": 0.2596205230181416,
+            "max": 0.5775253869593143,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 8.382829907157725e-05,
+            "min": 8.382829907157725e-05,
+            "max": 0.0032732852856490837,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 0.0005867980935010407,
+            "min": 0.0005867980935010407,
+            "max": 0.021797750579737155,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.09912168332660047,
+            "min": 0.06570389216053214,
+            "max": 0.09912168332660047,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.6938517832862033,
+            "min": 0.3942233529631929,
+            "max": 0.6938517832862033,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 0.0011226110353096256,
+            "min": 0.0011226110353096256,
+            "max": 0.04345472694873276,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.007858277247167379,
+            "min": 0.007858277247167379,
+            "max": 0.2893809637295982,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 24.386363636363637,
+            "min": 3.022727272727273,
+            "max": 24.386363636363637,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1073.0,
+            "min": 133.0,
+            "max": 1335.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 18.882754775610838,
+            "min": 2.3405465077270162,
+            "max": 18.882754775610838,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 830.8412101268768,
+            "min": 102.98404633998871,
+            "max": 1033.712035536766,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1734712356",
         "python_version": "3.10.12 (main, Nov  6 2024, 20:22:13) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget14 --no-graphics --force",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.5.1+cu121",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1734712934"
     },
+    "total": 578.3493716190005,
     "count": 1,
+    "self": 1.054238938000708,
     "children": {
         "run_training.setup": {
+            "total": 0.0741157310003473,
             "count": 1,
+            "self": 0.0741157310003473
         },
         "TrainerController.start_learning": {
+            "total": 577.2210169499995,
             "count": 1,
+            "self": 1.023016461919724,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.221277755000301,
                     "count": 1,
+                    "self": 3.221277755000301
                 },
                 "TrainerController.advance": {
+                    "total": 572.8177740130795,
+                    "count": 18215,
+                    "self": 0.4886110569404991,
                     "children": {
                         "env_step": {
+                            "total": 572.329162956139,
+                            "count": 18215,
+                            "self": 412.958888128067,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 158.93467012807014,
+                                    "count": 18215,
+                                    "self": 3.019371363108803,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 155.91529876496134,
+                                            "count": 18215,
+                                            "self": 155.91529876496134
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.43560470000193163,
+                                    "count": 18215,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 574.958547064989,
+                                            "count": 18215,
                                             "is_parallel": true,
+                                            "self": 249.5135799089685,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.003545269999449374,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0008927559983931133,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.002652514001056261,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.002652514001056261
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.1095645350005725,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0008891070010577096,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.00045683400003326824,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00045683400003326824
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.10594400099944323,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.10594400099944323
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.002274593000038294,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0004177509981673211,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.001856842001870973,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.001856842001870973
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 325.44496715602054,
+                                                    "count": 18214,
                                                     "is_parallel": true,
+                                                    "self": 15.366280455989,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 7.844114936006918,
+                                                            "count": 18214,
                                                             "is_parallel": true,
+                                                            "self": 7.844114936006918
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 255.65704095400451,
+                                                            "count": 18214,
                                                             "is_parallel": true,
+                                                            "self": 255.65704095400451
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 46.57753081002011,
+                                                            "count": 18214,
                                                             "is_parallel": true,
+                                                            "self": 9.352727159182905,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 37.2248036508372,
+                                                                    "count": 182140,
                                                                     "is_parallel": true,
+                                                                    "self": 37.2248036508372
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 0.0003579949998311349,
                     "count": 1,
+                    "self": 0.0003579949998311349,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 568.5701288763703,
+                                    "count": 516846,
                                     "is_parallel": true,
+                                    "self": 12.44683584858194,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 251.86072053578755,
+                                            "count": 516846,
                                             "is_parallel": true,
+                                            "self": 250.94444069578822,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 0.9162798399993335,
                                                     "count": 4,
                                                     "is_parallel": true,
+                                                    "self": 0.9162798399993335
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 304.2625724920008,
+                                            "count": 137,
                                             "is_parallel": true,
+                                            "self": 84.32923142198342,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 219.93334107001738,
+                                                    "count": 2046,
                                                     "is_parallel": true,
+                                                    "self": 219.93334107001738
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.15859072500006732,
                     "count": 1,
+                    "self": 0.0022051480000300216,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.1563855770000373,
                             "count": 1,
+                            "self": 0.1563855770000373
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -3,57 +3,57 @@
         "checkpoints": [
             {
                 "steps": 49936,
-                "file_path": "results/SnowballTarget11/SnowballTarget/SnowballTarget-49936.onnx",
                 "reward": null,
-                "creation_time": 1734645962.7687764,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget11/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             },
             {
                 "steps": 99960,
-                "file_path": "results/SnowballTarget11/SnowballTarget/SnowballTarget-99960.onnx",
                 "reward": null,
-                "creation_time": 1734646085.8705854,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget11/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             },
             {
                 "steps": 149984,
-                "file_path": "results/SnowballTarget11/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 17.272727272727273,
-                "creation_time": 1734646206.798937,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget11/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
                 "steps": 199984,
-                "file_path": "results/SnowballTarget11/SnowballTarget/SnowballTarget-199984.onnx",
                 "reward": null,
-                "creation_time": 1734646329.3024094,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget11/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
                 "steps": 200184,
-                "file_path": "results/SnowballTarget11/SnowballTarget/SnowballTarget-200184.onnx",
-                "reward": 23.88888888888889,
-                "creation_time": 1734646329.4213703,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget11/SnowballTarget/SnowballTarget-200184.pt"
                 ]
             }
         ],
         "final_checkpoint": {
             "steps": 200184,
-            "file_path": "results/SnowballTarget11/SnowballTarget.onnx",
-            "reward": 23.88888888888889,
-            "creation_time": 1734646329.4213703,
             "auxillary_file_paths": [
-                "results/SnowballTarget11/SnowballTarget/SnowballTarget-200184.pt"
             ]
         }
     },

         "checkpoints": [
             {
                 "steps": 49936,
+                "file_path": "results/SnowballTarget14/SnowballTarget/SnowballTarget-49936.onnx",
                 "reward": null,
+                "creation_time": 1734712502.5868247,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget14/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             },
             {
                 "steps": 99960,
+                "file_path": "results/SnowballTarget14/SnowballTarget/SnowballTarget-99960.onnx",
                 "reward": null,
+                "creation_time": 1734712646.3182104,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget14/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             },
             {
                 "steps": 149984,
+                "file_path": "results/SnowballTarget14/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 18.90909090909091,
+                "creation_time": 1734712788.6093626,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget14/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
                 "steps": 199984,
+                "file_path": "results/SnowballTarget14/SnowballTarget/SnowballTarget-199984.onnx",
                 "reward": null,
+                "creation_time": 1734712933.5976007,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget14/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
                 "steps": 200184,
+                "file_path": "results/SnowballTarget14/SnowballTarget/SnowballTarget-200184.onnx",
+                "reward": 24.666666666666668,
+                "creation_time": 1734712933.8229642,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget14/SnowballTarget/SnowballTarget-200184.pt"
                 ]
             }
         ],
         "final_checkpoint": {
             "steps": 200184,
+            "file_path": "results/SnowballTarget14/SnowballTarget.onnx",
+            "reward": 24.666666666666668,
+            "creation_time": 1734712933.8229642,
             "auxillary_file_paths": [
+                "results/SnowballTarget14/SnowballTarget/SnowballTarget-200184.pt"
             ]
         }
     },