cheetahbooked committed on May 21, 2025

Commit

c77a7bc

verified ·

1 Parent(s): 6863d9d

First Push

Browse files

Files changed (19) hide show

README.md +4 -4
SnowballTarget.onnx +3 -0
SnowballTarget/SnowballTarget-149984.onnx +3 -0
SnowballTarget/SnowballTarget-149984.pt +3 -0
SnowballTarget/SnowballTarget-199984.onnx +3 -0
SnowballTarget/SnowballTarget-199984.pt +3 -0
SnowballTarget/SnowballTarget-200112.onnx +3 -0
SnowballTarget/SnowballTarget-200112.pt +3 -0
SnowballTarget/SnowballTarget-49936.onnx +3 -0
SnowballTarget/SnowballTarget-49936.pt +3 -0
SnowballTarget/SnowballTarget-99960.onnx +3 -0
SnowballTarget/SnowballTarget-99960.pt +3 -0
SnowballTarget/checkpoint.pt +3 -0
SnowballTarget/events.out.tfevents.1747865206.129fa92bc555.1882.0 +3 -0
config.json +1 -1
configuration.yaml +10 -23
run_logs/Player-0.log +63 -118
run_logs/timers.json +193 -229
run_logs/training_status.json +31 -31

README.md CHANGED Viewed

@@ -1,14 +1,14 @@
 ---
 library_name: ml-agents
 tags:
-- Pyramids
 - deep-reinforcement-learning
 - reinforcement-learning
-- ML-Agents-Pyramids
 ---
-  # **ppo** Agent playing **Pyramids**
-  This is a trained model of a **ppo** agent playing **Pyramids**
   using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
   ## Usage (with ML-Agents)

 ---
 library_name: ml-agents
 tags:
+- SnowballTarget
 - deep-reinforcement-learning
 - reinforcement-learning
+- ML-Agents-SnowballTarget
 ---
+  # **ppo** Agent playing **SnowballTarget**
+  This is a trained model of a **ppo** agent playing **SnowballTarget**
   using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
   ## Usage (with ML-Agents)

SnowballTarget.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6700453b02a4a6da65600594f886a8637fd78ddc62f291f33a805b8107eedec
+size 650646

SnowballTarget/SnowballTarget-149984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c96b5cbeb3df3c1a4b919853babbb0d6425c4e41638a0812f59510acc9cccc2f
+size 650646

SnowballTarget/SnowballTarget-149984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:12427012d8edb458745087fc61f08ca1fe1f634719b2fbeb5b421446e2cc25f0
+size 3850564

SnowballTarget/SnowballTarget-199984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6700453b02a4a6da65600594f886a8637fd78ddc62f291f33a805b8107eedec
+size 650646

SnowballTarget/SnowballTarget-199984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0bc8342658d62d00827ed8af0ff617db6e5e828f770e22b2771f7517c72d9e4
+size 3850564

SnowballTarget/SnowballTarget-200112.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6700453b02a4a6da65600594f886a8637fd78ddc62f291f33a805b8107eedec
+size 650646

SnowballTarget/SnowballTarget-200112.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7e74a633c23889f75e3431d88319033eb01649245a8eab9041cb5797cb6af34
+size 3850564

SnowballTarget/SnowballTarget-49936.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d1a30061a7e2d89172a24095fa5f9f0572c4f6d204b3c25de23bb503607ebc56
+size 650646

SnowballTarget/SnowballTarget-49936.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a20914b9bddce69bc2c75834acd4325a163bfebfc6bc4a74d2598228b41ed69b
+size 3850487

SnowballTarget/SnowballTarget-99960.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae24bdf6a58c8712933a3efe7c65c09972fbae2eecebc9e6e4063eb7cdce57cb
+size 650646

SnowballTarget/SnowballTarget-99960.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96f3c6bf3708e3c228422909d3a4f19c27477644011c06a1b99022bc856683ac
+size 3850487

SnowballTarget/checkpoint.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:78ca460b7e30d4edaff49faa69743880627868d956c463747b08c6404144aa89
+size 3849717

SnowballTarget/events.out.tfevents.1747865206.129fa92bc555.1882.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e9424ccff8976ad75c7e7c0b7ce45e90966eee5251f54d73d7771e9bf28efaf5
+size 23493

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "rnd": {"gamma": 0.99, "strength": 0.01, "network_settings": {"normalize": false, "hidden_units": 64, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 3000000, "time_horizon": 128, "summary_freq": 30000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/Pyramids/Pyramids", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Pyramids Training", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -1,12 +1,12 @@
 default_settings: null
 behaviors:
-  Pyramids:
     trainer_type: ppo
     hyperparameters:
       batch_size: 128
       buffer_size: 2048
       learning_rate: 0.0003
-      beta: 0.01
       epsilon: 0.2
       lambd: 0.95
       num_epoch: 3
@@ -14,10 +14,10 @@ behaviors:
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
-    checkpoint_interval: 500000
     network_settings:
       normalize: false
-      hidden_units: 512
       num_layers: 2
       vis_encode_type: simple
       memory: null
@@ -35,30 +35,17 @@ behaviors:
           memory: null
           goal_conditioning_type: hyper
           deterministic: false
-      rnd:
-        gamma: 0.99
-        strength: 0.01
-        network_settings:
-          normalize: false
-          hidden_units: 64
-          num_layers: 3
-          vis_encode_type: simple
-          memory: null
-          goal_conditioning_type: hyper
-          deterministic: false
-        learning_rate: 0.0001
-        encoding_size: null
     init_path: null
-    keep_checkpoints: 5
     even_checkpoints: false
-    max_steps: 3000000
-    time_horizon: 128
-    summary_freq: 30000
     threaded: false
     self_play: null
     behavioral_cloning: null
 env_settings:
-  env_path: ./training-envs-executables/linux/Pyramids/Pyramids
   env_args: null
   base_port: 5005
   num_envs: 1
@@ -79,7 +66,7 @@ engine_settings:
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
-  run_id: Pyramids Training
   initialize_from: null
   load_model: false
   resume: false

 default_settings: null
 behaviors:
+  SnowballTarget:
     trainer_type: ppo
     hyperparameters:
       batch_size: 128
       buffer_size: 2048
       learning_rate: 0.0003
+      beta: 0.005
       epsilon: 0.2
       lambd: 0.95
       num_epoch: 3
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
+    checkpoint_interval: 50000
     network_settings:
       normalize: false
+      hidden_units: 256
       num_layers: 2
       vis_encode_type: simple
       memory: null
           memory: null
           goal_conditioning_type: hyper
           deterministic: false
     init_path: null
+    keep_checkpoints: 10
     even_checkpoints: false
+    max_steps: 200000
+    time_horizon: 64
+    summary_freq: 10000
     threaded: false
     self_play: null
     behavioral_cloning: null
 env_settings:
+  env_path: ./training-envs-executables/linux/SnowballTarget/SnowballTarget
   env_args: null
   base_port: 5005
   num_envs: 1
   no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
+  run_id: SnowballTarget1
   initialize_from: null
   load_model: false
   resume: false

run_logs/Player-0.log CHANGED Viewed

@@ -1,14 +1,12 @@
-Mono path[0] = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/Managed'
-Mono config path = '/content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/MonoBleedingEdge/etc'
-Found 1 interfaces on host : 0) 172.28.0.12
-Multi-casting "[IP] 172.28.0.12 [Port] 55052 [Flags] 2 [Guid] 4089059672 [EditorId] 764847374 [Version] 1048832 [Id] LinuxPlayer(13,172.28.0.12) [Debug] 0 [PackageName] LinuxPlayer [ProjectName] UnityEnvironment" to [225.0.0.222:54997]...
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Unity Technologies
-PlayerPrefs - Creating folder: /root/.config/unity3d/Unity Technologies/UnityEnvironment
 Unable to load player prefs
-Initialize engine version: 2021.3.5f1 (40eb3a945986)
-[Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/Pyramids/Pyramids_Data/UnitySubsystems
 Forcing GfxDevice: Null
 GfxDevice: creating device client; threaded=0; jobified=0
 NullGfxDevice:
@@ -36,31 +34,10 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.088 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
-WARNING: Shader Unsupported: 'Autodesk Interactive' - All subshaders removed
-WARNING: Shader Did you use #pragma only_renderers and omit this platform?
-WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-ERROR: Shader Autodesk Interactive shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
-WARNING: Shader Unsupported: 'Autodesk Interactive' - All subshaders removed
-WARNING: Shader Did you use #pragma only_renderers and omit this platform?
-WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-WARNING: Shader Unsupported: 'Legacy Shaders/Diffuse' - All subshaders removed
-WARNING: Shader Did you use #pragma only_renderers and omit this platform?
-WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-ERROR: Shader Legacy Shaders/Diffuse shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
-WARNING: Shader Unsupported: 'Legacy Shaders/Diffuse' - All subshaders removed
-WARNING: Shader Did you use #pragma only_renderers and omit this platform?
-WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-WARNING: Shader Unsupported: 'ML-Agents/GridPattern' - All subshaders removed
-WARNING: Shader Did you use #pragma only_renderers and omit this platform?
-WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-ERROR: Shader ML-Agents/GridPattern shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
-WARNING: Shader Unsupported: 'ML-Agents/GridPattern' - All subshaders removed
-WARNING: Shader Did you use #pragma only_renderers and omit this platform?
-WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
@@ -68,90 +45,85 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.804626 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
-PlayerConnection::CleanupMemory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [16.0 KB-32.0 KB]: 8110 frames, [32.0 KB-64.0 KB]: 24375 frames, [64.0 KB-128.0 KB]: 10825 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Overflow Count 0
     [ALLOC_TEMP_Background Job.Worker 8]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 10]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 6]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_AUDIO_FMOD mixer thread]
-      Initial Block Size 64.0 KB
-      Current Block Size 64.0 KB
-      Peak Allocated Bytes 0 B
-      Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 1]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 11]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 3]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_BatchDeleteObjects]
-      Initial Block Size 64.0 KB
-      Current Block Size 64.0 KB
-      Peak Allocated Bytes 0 B
-      Overflow Count 0
-    [ALLOC_TEMP_AUDIO_FMOD stream thread]
       Initial Block Size 64.0 KB
       Current Block Size 64.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 2]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 7]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 15]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Loading.PreloadManager]
-      Initial Block Size 256.0 KB
-      Current Block Size 320.0 KB
-      Peak Allocated Bytes 251.5 KB
-      Overflow Count 4
-    [ALLOC_TEMP_Profiler.Dispatcher]
-      Initial Block Size 64.0 KB
-      Current Block Size 64.0 KB
-      Peak Allocated Bytes 240 B
-      Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 12]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
@@ -171,64 +143,48 @@ PlayerConnection::CleanupMemory Statistics:
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 0]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 4]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Job.Worker 0]
-      Initial Block Size 256.0 KB
-      Current Block Size 256.0 KB
-      Peak Allocated Bytes 0.8 KB
-      Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 9]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Background Job.Worker 14]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_EnlightenWorker]
       Initial Block Size 64.0 KB
       Current Block Size 64.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
-    [ALLOC_TEMP_Loading.AsyncRead]
-      Initial Block Size 64.0 KB
-      Current Block Size 64.0 KB
-      Peak Allocated Bytes 128 B
-      Overflow Count 0
-[ALLOC_MEMORYPROFILER]
-  Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 43012 frames
-  Requested Block Size 1.0 MB
-  Peak Block count 2
-  Peak Allocated memory 1.6 MB
-  Peak Large allocation bytes 0 B
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 11050
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.7 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [8.0 MB-16.0 MB]: 1 frames, [16.0 MB-32.0 MB]: 43310 frames
       Requested Block Size 16.0 MB
-      Peak Block count 3
-      Peak Allocated memory 31.5 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 43311 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 22.0 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -255,63 +211,52 @@ PlayerConnection::CleanupMemory Statistics:
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.7 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 43310 frames, [64.0 KB-128.0 KB]: 1 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 67.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [64.0 KB-128.0 KB]: 43311 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 67.7 KB
       Peak Large allocation bytes 0 B
 [ALLOC_CACHEOBJECTS] Dual Thread Allocator
-  Peak main deferred allocation count 1
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.7 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 299 frames, [1.0 MB-2.0 MB]: 43012 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
-      Peak Allocated memory 1.4 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [1.0 MB-2.0 MB]: 43310 frames, [4.0 MB-8.0 MB]: 1 frames
       Requested Block Size 4.0 MB
-      Peak Block count 2
-      Peak Allocated memory 4.7 MB
       Peak Large allocation bytes 0 B
 [ALLOC_TYPETREE] Dual Thread Allocator
   Peak main deferred allocation count 0
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
-      Peak Allocated bytes 1.7 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 43311 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 43311 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
-      Peak Allocated memory 1.9 KB
       Peak Large allocation bytes 0 B
-[ALLOC_PROFILER]
-  Peak usage frame count: [16.0 KB-32.0 KB]: 43311 frames
-  Requested Block Size 16.0 MB
-  Peak Block count 1
-  Peak Allocated memory 29.2 KB
-  Peak Large allocation bytes 0 B
-    [ALLOC_PROFILER_BUCKET]
-      Large Block size 4.0 MB
-      Used Block count 1
-      Peak Allocated bytes 396 B
-##utp:{"type":"MemoryLeaks","version":2,"phase":"Immediate","time":1747825520277,"processId":2769,"allocatedMemory":1970133,"memoryLabels":[{"Default":9033},{"Permanent":1264},{"NewDelete":12801},{"Thread":34460},{"Manager":10603},{"VertexData":12},{"Geometry":280},{"Texture":16},{"Shader":69173},{"Material":24},{"GfxDevice":35248},{"Animation":304},{"Audio":3976},{"Physics":288},{"Serialization":216},{"Input":9176},{"JobScheduler":200},{"Mono":40},{"ScriptingNativeRuntime":216},{"BaseObject":1609212},{"Resource":592},{"Renderer":1936},{"Transform":48},{"File":800},{"WebCam":24},{"Culling":40},{"Terrain":953},{"Wind":24},{"String":3447},{"DynamicArray":30868},{"HashMap":7680},{"Utility":1360},{"PoolAlloc":1160},{"TypeTree":1792},{"ScriptManager":80},{"RuntimeInitializeOnLoadManager":72},{"SpriteAtlas":112},{"GI":3272},{"Unet":16},{"Director":7760},{"WebRequest":720},{"VR":45473},{"SceneManager":424},{"Video":32},{"LazyScriptCache":32},{"NativeArray":384},{"Camera":25},{"Secure":1},{"SerializationCache":624},{"APIUpdating":5872},{"Subsystems":384},{"VirtualTexturing":57552},{"AssetReference":32}]}

+Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/Managed'
+Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
+PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
+PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
 Unable to load player prefs
+Initialize engine version: 2021.3.14f1 (eee1884e7226)
+[Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 GfxDevice: creating device client; threaded=0; jobified=0
 NullGfxDevice:
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.085 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.684726 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
+Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5367 frames, [16.0 KB-32.0 KB]: 90 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Overflow Count 0
+    [ALLOC_TEMP_Loading.AsyncRead]
+      Initial Block Size 64.0 KB
+      Current Block Size 64.0 KB
+      Peak Allocated Bytes 198 B
+      Overflow Count 0
+    [ALLOC_TEMP_Loading.PreloadManager]
+      Initial Block Size 256.0 KB
+      Current Block Size 304.0 KB
+      Peak Allocated Bytes 228.9 KB
+      Overflow Count 4
     [ALLOC_TEMP_Background Job.Worker 8]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 9]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Job.Worker 0]
+      Initial Block Size 256.0 KB
+      Current Block Size 256.0 KB
+      Peak Allocated Bytes 3.6 KB
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 10]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 14]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 6]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 12]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_EnlightenWorker]
       Initial Block Size 64.0 KB
       Current Block Size 64.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 15]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 1]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 2]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 7]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 11]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 3]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 0]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 4]
       Initial Block Size 32.0 KB
       Current Block Size 32.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
+    [ALLOC_TEMP_BatchDeleteObjects]
       Initial Block Size 64.0 KB
       Current Block Size 64.0 KB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 45
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5458 frames
       Requested Block Size 16.0 MB
+      Peak Block count 1
+      Peak Allocated memory 6.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5458 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.9 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 4981 frames, [64.0 KB-128.0 KB]: 477 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 67.3 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5458 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 39.6 KB
       Peak Large allocation bytes 0 B
 [ALLOC_CACHEOBJECTS] Dual Thread Allocator
+  Peak main deferred allocation count 0
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5458 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
+      Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5457 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
+      Peak Block count 1
+      Peak Allocated memory 2.2 MB
       Peak Large allocation bytes 0 B
 [ALLOC_TYPETREE] Dual Thread Allocator
   Peak main deferred allocation count 0
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
+      Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5458 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5458 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
+      Peak Allocated memory 1.7 KB
       Peak Large allocation bytes 0 B

run_logs/timers.json CHANGED Viewed

@@ -1,250 +1,214 @@
 {
     "name": "root",
     "gauges": {
-        "Pyramids.Policy.Entropy.mean": {
-            "value": 0.23484036326408386,
-            "min": 0.23266544938087463,
-            "max": 1.408982276916504,
-            "count": 76
         },
-        "Pyramids.Policy.Entropy.sum": {
-            "value": 7052.7255859375,
-            "min": 6961.35009765625,
-            "max": 42742.88671875,
-            "count": 76
         },
-        "Pyramids.Step.mean": {
-            "value": 2279960.0,
-            "min": 29952.0,
-            "max": 2279960.0,
-            "count": 76
         },
-        "Pyramids.Step.sum": {
-            "value": 2279960.0,
-            "min": 29952.0,
-            "max": 2279960.0,
-            "count": 76
         },
-        "Pyramids.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 0.8057253360748291,
-            "min": -0.09411876648664474,
-            "max": 0.8561700582504272,
-            "count": 76
         },
-        "Pyramids.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 242.52333068847656,
-            "min": -22.870861053466797,
-            "max": 260.27569580078125,
-            "count": 76
         },
-        "Pyramids.Policy.RndValueEstimate.mean": {
-            "value": 0.006281580310314894,
-            "min": -0.08096986263990402,
-            "max": 0.699350118637085,
-            "count": 76
         },
-        "Pyramids.Policy.RndValueEstimate.sum": {
-            "value": 1.8907556533813477,
-            "min": -21.21410369873047,
-            "max": 165.7459716796875,
-            "count": 76
         },
-        "Pyramids.Losses.PolicyLoss.mean": {
-            "value": 0.06779443854854132,
-            "min": 0.06443775010174507,
-            "max": 0.07398701549620654,
-            "count": 76
         },
-        "Pyramids.Losses.PolicyLoss.sum": {
-            "value": 0.9491221396795786,
-            "min": 0.5179091084734457,
-            "max": 1.088565707311728,
-            "count": 76
         },
-        "Pyramids.Losses.ValueLoss.mean": {
-            "value": 0.014877840269556537,
-            "min": 0.000366937582077912,
-            "max": 0.017074454442546187,
-            "count": 76
         },
-        "Pyramids.Losses.ValueLoss.sum": {
-            "value": 0.20828976377379152,
-            "min": 0.0044032509849349435,
-            "max": 0.2561168166381928,
-            "count": 76
         },
-        "Pyramids.Policy.LearningRate.mean": {
-            "value": 7.351536835204521e-05,
-            "min": 7.351536835204521e-05,
-            "max": 0.00029838354339596195,
-            "count": 76
         },
-        "Pyramids.Policy.LearningRate.sum": {
-            "value": 0.001029215156928633,
-            "min": 0.001029215156928633,
-            "max": 0.0039692895769035,
-            "count": 76
         },
-        "Pyramids.Policy.Epsilon.mean": {
-            "value": 0.12450509761904763,
-            "min": 0.12450509761904763,
-            "max": 0.19946118095238097,
-            "count": 76
         },
-        "Pyramids.Policy.Epsilon.sum": {
-            "value": 1.7430713666666668,
-            "min": 1.3962282666666668,
-            "max": 2.7230965,
-            "count": 76
         },
-        "Pyramids.Policy.Beta.mean": {
-            "value": 0.0024580592521428572,
-            "min": 0.0024580592521428572,
-            "max": 0.009946171977142856,
-            "count": 76
         },
-        "Pyramids.Policy.Beta.sum": {
-            "value": 0.03441282953,
-            "min": 0.03441282953,
-            "max": 0.13231734035,
-            "count": 76
         },
-        "Pyramids.Losses.RNDLoss.mean": {
-            "value": 0.007769245188683271,
-            "min": 0.007686541881412268,
-            "max": 0.624336302280426,
-            "count": 76
         },
-        "Pyramids.Losses.RNDLoss.sum": {
-            "value": 0.10876943171024323,
-            "min": 0.10761158913373947,
-            "max": 4.370354175567627,
-            "count": 76
         },
-        "Pyramids.Environment.EpisodeLength.mean": {
-            "value": 239.616,
-            "min": 209.04379562043795,
-            "max": 999.0,
-            "count": 76
         },
-        "Pyramids.Environment.EpisodeLength.sum": {
-            "value": 29952.0,
-            "min": 15984.0,
-            "max": 32952.0,
-            "count": 76
         },
-        "Pyramids.Environment.CumulativeReward.mean": {
-            "value": 1.7443775829076766,
-            "min": -1.0000000521540642,
-            "max": 1.7909561924255677,
-            "count": 76
-        },
-        "Pyramids.Environment.CumulativeReward.sum": {
-            "value": 218.0471978634596,
-            "min": -31.99640165269375,
-            "max": 245.36099836230278,
-            "count": 76
-        },
-        "Pyramids.Policy.ExtrinsicReward.mean": {
-            "value": 1.7443775829076766,
-            "min": -1.0000000521540642,
-            "max": 1.7909561924255677,
-            "count": 76
-        },
-        "Pyramids.Policy.ExtrinsicReward.sum": {
-            "value": 218.0471978634596,
-            "min": -31.99640165269375,
-            "max": 245.36099836230278,
-            "count": 76
-        },
-        "Pyramids.Policy.RndReward.mean": {
-            "value": 0.019240734382416122,
-            "min": 0.01671900214845345,
-            "max": 13.039072195068002,
-            "count": 76
-        },
-        "Pyramids.Policy.RndReward.sum": {
-            "value": 2.405091797802015,
-            "min": 2.290503294338123,
-            "max": 208.62515512108803,
-            "count": 76
-        },
-        "Pyramids.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 76
         },
-        "Pyramids.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 76
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1747820019",
         "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.7.0+cu126",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1747825520"
     },
-    "total": 5500.60708736,
     "count": 1,
-    "self": 0.4038944320000155,
     "children": {
         "run_training.setup": {
-            "total": 0.02201564800009237,
             "count": 1,
-            "self": 0.02201564800009237
         },
         "TrainerController.start_learning": {
-            "total": 5500.18117728,
             "count": 1,
-            "self": 3.0123167031688354,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 3.3193438119999428,
                     "count": 1,
-                    "self": 3.3193438119999428
                 },
                 "TrainerController.advance": {
-                    "total": 5493.719128906832,
-                    "count": 149434,
-                    "self": 3.2605887727695517,
                     "children": {
                         "env_step": {
-                            "total": 3969.6480270299935,
-                            "count": 149434,
-                            "self": 3636.970388604138,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 330.93491936889984,
-                                    "count": 149434,
-                                    "self": 10.282463170940105,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 320.65245619795974,
-                                            "count": 144370,
-                                            "self": 320.65245619795974
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 1.7427190569558206,
-                                    "count": 149433,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 5489.06271309916,
-                                            "count": 149433,
                                             "is_parallel": true,
-                                            "self": 2105.9187310312045,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -253,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.0055780170000616636,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.004291077999937443,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.001286939000124221,
-                                                                    "count": 8,
                                                                     "is_parallel": true,
-                                                                    "self": 0.001286939000124221
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.04780464300006315,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0005516119999811053,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00047407600004589767,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00047407600004589767
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.0451506030000246,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0451506030000246
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.001628352000011546,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0003737289999889981,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0012546230000225478,
-                                                                            "count": 8,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0012546230000225478
                                                                         }
                                                                     }
                                                                 }
@@ -303,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 3383.143982067955,
-                                                    "count": 149432,
                                                     "is_parallel": true,
-                                                    "self": 71.99999781395582,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 52.933618838992516,
-                                                            "count": 149432,
                                                             "is_parallel": true,
-                                                            "self": 52.933618838992516
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 3041.1096478719824,
-                                                            "count": 149432,
                                                             "is_parallel": true,
-                                                            "self": 3041.1096478719824
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 217.10071754302442,
-                                                            "count": 149432,
                                                             "is_parallel": true,
-                                                            "self": 43.885075777336624,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 173.2156417656878,
-                                                                    "count": 1195456,
                                                                     "is_parallel": true,
-                                                                    "self": 173.2156417656878
                                                                 }
                                                             }
                                                         }
@@ -343,31 +307,31 @@
                             }
                         },
                         "trainer_advance": {
-                            "total": 1520.8105131040688,
-                            "count": 149433,
-                            "self": 6.028905329054851,
                             "children": {
                                 "process_trajectory": {
-                                    "total": 295.482135553017,
-                                    "count": 149433,
-                                    "self": 295.08266985801595,
                                     "children": {
                                         "RLTrainer._checkpoint": {
-                                            "total": 0.3994656950010267,
                                             "count": 4,
-                                            "self": 0.3994656950010267
                                         }
                                     }
                                 },
                                 "_update_policy": {
-                                    "total": 1219.299472221997,
-                                    "count": 1069,
-                                    "self": 676.9231931110622,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
-                                            "total": 542.3762791109347,
-                                            "count": 52575,
-                                            "self": 542.3762791109347
                                         }
                                     }
                                 }
@@ -376,19 +340,19 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 1.333999534836039e-06,
                     "count": 1,
-                    "self": 1.333999534836039e-06
                 },
                 "TrainerController._save_models": {
-                    "total": 0.13038652399973216,
                     "count": 1,
-                    "self": 0.0017396149996784516,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.1286469090000537,
                             "count": 1,
-                            "self": 0.1286469090000537
                         }
                     }
                 }

 {
     "name": "root",
     "gauges": {
+        "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.8584476709365845,
+            "min": 0.8584476709365845,
+            "max": 2.842935800552368,
+            "count": 20
         },
+        "SnowballTarget.Policy.Entropy.sum": {
+            "value": 8158.6865234375,
+            "min": 8158.6865234375,
+            "max": 29020.689453125,
+            "count": 20
         },
+        "SnowballTarget.Step.mean": {
+            "value": 199984.0,
+            "min": 9952.0,
+            "max": 199984.0,
+            "count": 20
         },
+        "SnowballTarget.Step.sum": {
+            "value": 199984.0,
+            "min": 9952.0,
+            "max": 199984.0,
+            "count": 20
         },
+        "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 13.049479484558105,
+            "min": 0.3136551082134247,
+            "max": 13.124421119689941,
+            "count": 20
         },
+        "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2544.6484375,
+            "min": 60.849090576171875,
+            "max": 2680.4580078125,
+            "count": 20
         },
+        "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.06658601740677042,
+            "min": 0.06315491588725754,
+            "max": 0.07810461898105703,
+            "count": 20
         },
+        "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.2663440696270817,
+            "min": 0.25261966354903015,
+            "max": 0.36110270168865094,
+            "count": 20
         },
+        "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.21449150166967337,
+            "min": 0.13745489573864011,
+            "max": 0.2914017583517467,
+            "count": 20
         },
+        "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.8579660066786935,
+            "min": 0.5498195829545605,
+            "max": 1.331362451992783,
+            "count": 20
         },
+        "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 8.082097306000005e-06,
+            "min": 8.082097306000005e-06,
+            "max": 0.000291882002706,
+            "count": 20
         },
+        "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 3.232838922400002e-05,
+            "min": 3.232838922400002e-05,
+            "max": 0.00138516003828,
+            "count": 20
         },
+        "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10269400000000001,
+            "min": 0.10269400000000001,
+            "max": 0.19729400000000002,
+            "count": 20
         },
+        "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.41077600000000003,
+            "min": 0.41077600000000003,
+            "max": 0.96172,
+            "count": 20
         },
+        "SnowballTarget.Policy.Beta.mean": {
+            "value": 0.0001444306000000001,
+            "min": 0.0001444306000000001,
+            "max": 0.0048649706,
+            "count": 20
         },
+        "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.0005777224000000004,
+            "min": 0.0005777224000000004,
+            "max": 0.023089828,
+            "count": 20
         },
+        "SnowballTarget.Environment.EpisodeLength.mean": {
+            "value": 199.0,
+            "min": 199.0,
+            "max": 199.0,
+            "count": 20
         },
+        "SnowballTarget.Environment.EpisodeLength.sum": {
+            "value": 8756.0,
+            "min": 8756.0,
+            "max": 10945.0,
+            "count": 20
         },
+        "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 25.818181818181817,
+            "min": 3.909090909090909,
+            "max": 25.818181818181817,
+            "count": 20
         },
+        "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1136.0,
+            "min": 172.0,
+            "max": 1410.0,
+            "count": 20
         },
+        "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 25.818181818181817,
+            "min": 3.909090909090909,
+            "max": 25.818181818181817,
+            "count": 20
         },
+        "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1136.0,
+            "min": 172.0,
+            "max": 1410.0,
+            "count": 20
         },
+        "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 20
         },
+        "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 20
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1747865206",
         "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.7.0+cu126",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1747865661"
     },
+    "total": 454.97723513399995,
     "count": 1,
+    "self": 0.4411420389999421,
     "children": {
         "run_training.setup": {
+            "total": 0.024227455000016107,
             "count": 1,
+            "self": 0.024227455000016107
         },
         "TrainerController.start_learning": {
+            "total": 454.51186564,
             "count": 1,
+            "self": 0.43310408800306277,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.4534281279999846,
                     "count": 1,
+                    "self": 3.4534281279999846
                 },
                 "TrainerController.advance": {
+                    "total": 450.54211882099696,
+                    "count": 18192,
+                    "self": 0.4419423699969798,
                     "children": {
                         "env_step": {
+                            "total": 320.99684070099534,
+                            "count": 18192,
+                            "self": 245.27953110598202,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 75.46038014800388,
+                                    "count": 18192,
+                                    "self": 1.3905838039989362,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 74.06979634400494,
+                                            "count": 18192,
+                                            "self": 74.06979634400494
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.25692944700944054,
+                                    "count": 18192,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 452.9870898940104,
+                                            "count": 18192,
                                             "is_parallel": true,
+                                            "self": 238.74046401700815,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.005886660999976812,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.004318263999948613,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0015683970000281988,
+                                                                    "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0015683970000281988
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.046809171999996124,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0005961800000591211,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.0004709409999463787,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0004709409999463787
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.04391261000000668,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.04391261000000668
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0018294409999839445,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0003484389999925952,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0014810019999913493,
+                                                                            "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0014810019999913493
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 214.24662587700226,
+                                                    "count": 18191,
                                                     "is_parallel": true,
+                                                    "self": 10.248900232997414,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.588276356995493,
+                                                            "count": 18191,
                                                             "is_parallel": true,
+                                                            "self": 5.588276356995493
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 165.94509448300454,
+                                                            "count": 18191,
                                                             "is_parallel": true,
+                                                            "self": 165.94509448300454
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 32.46435480400481,
+                                                            "count": 18191,
                                                             "is_parallel": true,
+                                                            "self": 6.0540524750153395,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 26.410302328989474,
+                                                                    "count": 181910,
                                                                     "is_parallel": true,
+                                                                    "self": 26.410302328989474
                                                                 }
                                                             }
                                                         }
                             }
                         },
                         "trainer_advance": {
+                            "total": 129.10333575000465,
+                            "count": 18192,
+                            "self": 0.5324587160004057,
                             "children": {
                                 "process_trajectory": {
+                                    "total": 28.391561994004576,
+                                    "count": 18192,
+                                    "self": 27.960574152004654,
                                     "children": {
                                         "RLTrainer._checkpoint": {
+                                            "total": 0.43098784199992224,
                                             "count": 4,
+                                            "self": 0.43098784199992224
                                         }
                                     }
                                 },
                                 "_update_policy": {
+                                    "total": 100.17931503999966,
+                                    "count": 90,
+                                    "self": 40.61161785399406,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
+                                            "total": 59.5676971860056,
+                                            "count": 4587,
+                                            "self": 59.5676971860056
                                         }
                                     }
                                 }
                     }
                 },
                 "trainer_threads": {
+                    "total": 9.149999868895975e-07,
                     "count": 1,
+                    "self": 9.149999868895975e-07
                 },
                 "TrainerController._save_models": {
+                    "total": 0.08321368800000073,
                     "count": 1,
+                    "self": 0.0008544639999854553,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.08235922400001527,
                             "count": 1,
+                            "self": 0.08235922400001527
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -1,59 +1,59 @@
 {
-    "Pyramids": {
         "checkpoints": [
             {
-                "steps": 499932,
-                "file_path": "results/Pyramids Training/Pyramids/Pyramids-499932.onnx",
-                "reward": null,
-                "creation_time": 1747821013.4841912,
                 "auxillary_file_paths": [
-                    "results/Pyramids Training/Pyramids/Pyramids-499932.pt"
                 ]
             },
             {
-                "steps": 999974,
-                "file_path": "results/Pyramids Training/Pyramids/Pyramids-999974.onnx",
-                "reward": 1.6546666125456493,
-                "creation_time": 1747822169.9901326,
                 "auxillary_file_paths": [
-                    "results/Pyramids Training/Pyramids/Pyramids-999974.pt"
                 ]
             },
             {
-                "steps": 1499897,
-                "file_path": "results/Pyramids Training/Pyramids/Pyramids-1499897.onnx",
-                "reward": null,
-                "creation_time": 1747823431.5009575,
                 "auxillary_file_paths": [
-                    "results/Pyramids Training/Pyramids/Pyramids-1499897.pt"
                 ]
             },
             {
-                "steps": 1999944,
-                "file_path": "results/Pyramids Training/Pyramids/Pyramids-1999944.onnx",
-                "reward": 1.8343333154916763,
-                "creation_time": 1747824717.2055092,
                 "auxillary_file_paths": [
-                    "results/Pyramids Training/Pyramids/Pyramids-1999944.pt"
                 ]
             },
             {
-                "steps": 2308937,
-                "file_path": "results/Pyramids Training/Pyramids/Pyramids-2308937.onnx",
-                "reward": 1.8876666277647018,
-                "creation_time": 1747825519.9423451,
                 "auxillary_file_paths": [
-                    "results/Pyramids Training/Pyramids/Pyramids-2308937.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 2308937,
-            "file_path": "results/Pyramids Training/Pyramids.onnx",
-            "reward": 1.8876666277647018,
-            "creation_time": 1747825519.9423451,
             "auxillary_file_paths": [
-                "results/Pyramids Training/Pyramids/Pyramids-2308937.pt"
             ]
         }
     },

 {
+    "SnowballTarget": {
         "checkpoints": [
             {
+                "steps": 49936,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
+                "reward": 17.272727272727273,
+                "creation_time": 1747865320.000131,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             },
             {
+                "steps": 99960,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
+                "reward": 22.818181818181817,
+                "creation_time": 1747865432.4897733,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             },
             {
+                "steps": 149984,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 25.545454545454547,
+                "creation_time": 1747865548.956846,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
+                "steps": 199984,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
+                "reward": 25.90909090909091,
+                "creation_time": 1747865660.5671692,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
+                "steps": 200112,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": 25.90909090909091,
+                "creation_time": 1747865660.6622632,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
+            "steps": 200112,
+            "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 25.90909090909091,
+            "creation_time": 1747865660.6622632,
             "auxillary_file_paths": [
+                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },