Deinigu committed on Nov 7, 2025

Commit

66bb524

verified ·

1 Parent(s): 7c13340

Second training

Browse files

Files changed (28) hide show

SnowballTarget.onnx +1 -1
SnowballTarget/SnowballTarget-349904.onnx +3 -0
SnowballTarget/SnowballTarget-349904.pt +3 -0
SnowballTarget/SnowballTarget-399992.onnx +3 -0
SnowballTarget/SnowballTarget-399992.pt +3 -0
SnowballTarget/SnowballTarget-449992.onnx +3 -0
SnowballTarget/SnowballTarget-449992.pt +3 -0
SnowballTarget/SnowballTarget-499888.onnx +3 -0
SnowballTarget/SnowballTarget-499888.pt +3 -0
SnowballTarget/SnowballTarget-549976.onnx +3 -0
SnowballTarget/SnowballTarget-549976.pt +3 -0
SnowballTarget/SnowballTarget-599936.onnx +3 -0
SnowballTarget/SnowballTarget-599936.pt +3 -0
SnowballTarget/SnowballTarget-601216.onnx +3 -0
SnowballTarget/SnowballTarget-601216.pt +3 -0
SnowballTarget/checkpoint.pt +1 -1
SnowballTarget/events.out.tfevents.1762516276.1696528d3eb8.13852.0 +3 -0
SnowballTarget/events.out.tfevents.1762516310.1696528d3eb8.14051.0 +3 -0
SnowballTarget/events.out.tfevents.1762516326.1696528d3eb8.14172.0 +3 -0
SnowballTarget/events.out.tfevents.1762516380.1696528d3eb8.14451.0 +3 -0
SnowballTarget/events.out.tfevents.1762516416.1696528d3eb8.14658.0 +3 -0
SnowballTarget/events.out.tfevents.1762516478.1696528d3eb8.14973.0 +3 -0
SnowballTarget/events.out.tfevents.1762516961.1696528d3eb8.17069.0 +3 -0
config.json +1 -1
configuration.yaml +2 -2
run_logs/Player-0.log +14 -17
run_logs/timers.json +162 -162
run_logs/training_status.json +46 -28

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0d62a0f07d4d14d0bcd11ce3bb11267188ae6449c22af14cc61b81aa70fc3066
 size 650646

 version https://git-lfs.github.com/spec/v1
+oid sha256:6585d80c29790a373df80fe4ff475e06f1f3580daf21556880f03f1287deedfd
 size 650646

SnowballTarget/SnowballTarget-349904.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e06883af0a54913f4103034e13accbfcd9fe22349fed9d5c332536e9aa6e4537
+size 650646

SnowballTarget/SnowballTarget-349904.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:df030c82a18fca63bb33d47638b3b42acfdce5318e8aff7eacd13d22fd383762
+size 3850564

SnowballTarget/SnowballTarget-399992.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1f96e6752002978b5e6c52764e9c5ca3829f6eae79c621cba5ee1713f0c82343
+size 650646

SnowballTarget/SnowballTarget-399992.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d46c3a164e723dce6a4cb45d5f9631146aaa3377fee8de2a023fa2f9bf98df92
+size 3850564

SnowballTarget/SnowballTarget-449992.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a8701db369a38a873481f4b1d28dfc1fbff8906717f5f1ff8da077cf9fd1375
+size 650646

SnowballTarget/SnowballTarget-449992.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b377310a81362e77ad1ad2a3ad6083bd348a53e08d6f33edcf66a22b5d85a6d5
+size 3850564

SnowballTarget/SnowballTarget-499888.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2da6f6520f8ffbfbdf79a3953fa04e5d2b05c5adc670763de0bc8f28d60ad668
+size 650646

SnowballTarget/SnowballTarget-499888.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7802173a8d296843d588f00448b30b97e0e00c2fb2ba996bab28598df250edbc
+size 3850564

SnowballTarget/SnowballTarget-549976.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f0b5d59dd6f2ebbdebe038cd12fe90e85c1c1173c2d7700f0462dce9e3aeae7
+size 650646

SnowballTarget/SnowballTarget-549976.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bcb4763c0b676054b40403c9b495b4f6f2dce961edfef8bf7f2ae6b43331dc88
+size 3850564

SnowballTarget/SnowballTarget-599936.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6585d80c29790a373df80fe4ff475e06f1f3580daf21556880f03f1287deedfd
+size 650646

SnowballTarget/SnowballTarget-599936.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:241a6c125e858e271db27eafcef316b58c9baf20a20e60c641a56072a3d87d94
+size 3850564

SnowballTarget/SnowballTarget-601216.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6585d80c29790a373df80fe4ff475e06f1f3580daf21556880f03f1287deedfd
+size 650646

SnowballTarget/SnowballTarget-601216.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dde4ef79e73ffa1be74af00888871fa806f6020dfe90487debfec79417cb19bd
+size 3850564

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:03ac616c4cdf1fe3d9dab4ce8f9586a2e00dced6508903d56ab2879c11004757
 size 3849717

 version https://git-lfs.github.com/spec/v1
+oid sha256:06e6442f3ac1f9c1543765a11284c1e7c8443b9c8afbc3152d3148cf3786d20c
 size 3849717

SnowballTarget/events.out.tfevents.1762516276.1696528d3eb8.13852.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d415bf4c5fedc2d98a809bed99306d354f4a762708fa8b89955be1dd0f585b3
+size 1117

SnowballTarget/events.out.tfevents.1762516310.1696528d3eb8.14051.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:993e2da654be8713104951fbbd63e09442b2fc24385490802bee43bd18c918f7
+size 1117

SnowballTarget/events.out.tfevents.1762516326.1696528d3eb8.14172.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a2c985db463e67b777ba2b58d3be173f2af8900f708c188fdad51cbac91542b
+size 1117

SnowballTarget/events.out.tfevents.1762516380.1696528d3eb8.14451.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1786bbb553785d4c0af3c2d249104edb21f156b66788214f1a12ec76e099312
+size 1117

SnowballTarget/events.out.tfevents.1762516416.1696528d3eb8.14658.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b71b219c03ea90e7dc0cd6c2506691d9503e8459ddc865cbbd2a9a861c335070
+size 1117

SnowballTarget/events.out.tfevents.1762516478.1696528d3eb8.14973.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00cb0eca41063fb6c49066785e8c612daf13215236a3a9332953d0eab1f092fa
+size 11335

SnowballTarget/events.out.tfevents.1762516961.1696528d3eb8.17069.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3efbbacb589da797cae34ed1a64db48722c4e428ff862f9b2d1845c1637484ec
+size 35134

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 1024, "buffer_size": 4096, "learning_rate": 0.0001, "beta": 0.0005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 7, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 128, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 1024, "buffer_size": 4096, "learning_rate": 0.0001, "beta": 0.0005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 7, "even_checkpoints": false, "max_steps": 600000, "time_horizon": 128, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -38,7 +38,7 @@ behaviors:
     init_path: null
     keep_checkpoints: 7
     even_checkpoints: false
-    max_steps: 200000
     time_horizon: 128
     summary_freq: 10000
     threaded: false
@@ -69,7 +69,7 @@ checkpoint_settings:
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
-  resume: false
   force: false
   train_model: false
   inference: false

     init_path: null
     keep_checkpoints: 7
     even_checkpoints: false
+    max_steps: 600000
     time_horizon: 128
     summary_freq: 10000
     threaded: false
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
+  resume: true
   force: false
   train_model: false
   inference: false

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.082 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.642780 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5368 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,19 +166,19 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 44
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 7.4 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 17.2 MB
@@ -213,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 3847 frames, [64.0 KB-128.0 KB]: 1613 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 67.3 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5460 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5460 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5459 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5460 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5460 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.090 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.623103 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 8062 frames, [16.0 KB-32.0 KB]: 136 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 46
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 8199 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 7.8 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 8199 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 17.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 2592 frames, [64.0 KB-128.0 KB]: 5607 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 68.6 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 8199 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 8199 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 8198 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 8199 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 8199 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,213 +2,213 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 2.3241453170776367,
-            "min": 2.3241453170776367,
-            "max": 2.890087842941284,
-            "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 22293.201171875,
-            "min": 22137.365234375,
-            "max": 31779.72265625,
-            "count": 20
         },
         "SnowballTarget.Step.mean": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
         },
         "SnowballTarget.Step.sum": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 4.310549736022949,
-            "min": -0.01074505876749754,
-            "max": 4.310549736022949,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 435.36553955078125,
-            "min": -1.0422706604003906,
-            "max": 435.36553955078125,
-            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
-            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
             "value": 10945.0,
             "min": 8756.0,
             "max": 10945.0,
-            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 8.961538461538462,
-            "min": 2.6363636363636362,
-            "max": 8.961538461538462,
-            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 466.0,
-            "min": 116.0,
-            "max": 466.0,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 8.961538461538462,
-            "min": 2.6363636363636362,
-            "max": 8.961538461538462,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 466.0,
-            "min": 116.0,
-            "max": 466.0,
-            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.026437590531713795,
-            "min": 0.016743642057311565,
-            "max": 0.030202925961930305,
-            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.05287518106342759,
-            "min": 0.03348728411462313,
-            "max": 0.0800755696551884,
-            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.31467231238881743,
-            "min": 0.12198344524949789,
-            "max": 0.32054602975646657,
-            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.6293446247776349,
-            "min": 0.24396689049899578,
-            "max": 0.9477601523200669,
-            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 2.100097900000002e-06,
-            "min": 2.100097900000002e-06,
-            "max": 9.670000330000001e-05,
-            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 4.200195800000004e-06,
-            "min": 4.200195800000004e-06,
-            "max": 0.0002472000528,
-            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.1021,
-            "min": 0.1021,
-            "max": 0.19669999999999999,
-            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.2042,
-            "min": 0.2042,
-            "max": 0.5472,
-            "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 2.0290000000000007e-05,
-            "min": 2.0290000000000007e-05,
-            "max": 0.0004838300000000001,
-            "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 4.0580000000000015e-05,
-            "min": 4.0580000000000015e-05,
-            "max": 0.00124128,
-            "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 20
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 20
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1762514617",
         "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.8.0+cu128",
         "numpy_version": "1.23.5",
-        "end_time_seconds": "1762515010"
     },
-    "total": 392.75992730100006,
     "count": 1,
-    "self": 0.4307554690001325,
     "children": {
         "run_training.setup": {
-            "total": 0.025848885999948834,
             "count": 1,
-            "self": 0.025848885999948834
         },
         "TrainerController.start_learning": {
-            "total": 392.303322946,
             "count": 1,
-            "self": 0.3759268440167034,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 2.7668223719999787,
                     "count": 1,
-                    "self": 2.7668223719999787
                 },
                 "TrainerController.advance": {
-                    "total": 389.07903029298336,
-                    "count": 18200,
-                    "self": 0.3792768889875333,
                     "children": {
                         "env_step": {
-                            "total": 321.31676956099454,
-                            "count": 18200,
-                            "self": 250.54857935896212,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 70.54734476501358,
-                                    "count": 18200,
-                                    "self": 1.275305534998779,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 69.2720392300148,
-                                            "count": 18200,
-                                            "self": 69.2720392300148
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.22084543701885195,
-                                    "count": 18200,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 390.59533471098644,
-                                            "count": 18200,
                                             "is_parallel": true,
-                                            "self": 170.57021740298683,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.004687703000172405,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.003302252000594308,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0013854509995780973,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0013854509995780973
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.037418512000158444,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0006120630002897087,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.0004695739999078796,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0004695739999078796
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.03440155899988895,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.03440155899988895
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0019353160000719072,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00036776299975826987,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0015675530003136373,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0015675530003136373
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 220.0251173079996,
-                                                    "count": 18199,
                                                     "is_parallel": true,
-                                                    "self": 10.229218741002569,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 5.431949275014631,
-                                                            "count": 18199,
                                                             "is_parallel": true,
-                                                            "self": 5.431949275014631
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 167.30069428099773,
-                                                            "count": 18199,
                                                             "is_parallel": true,
-                                                            "self": 167.30069428099773
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 37.063255010984676,
-                                                            "count": 18199,
                                                             "is_parallel": true,
-                                                            "self": 6.700471101969697,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 30.36278390901498,
-                                                                    "count": 181990,
                                                                     "is_parallel": true,
-                                                                    "self": 30.36278390901498
                                                                 }
                                                             }
                                                         }
@@ -307,31 +307,31 @@
                             }
                         },
                         "trainer_advance": {
-                            "total": 67.38298384300128,
-                            "count": 18200,
-                            "self": 0.5043809000158035,
                             "children": {
                                 "process_trajectory": {
-                                    "total": 21.229000259985924,
-                                    "count": 18200,
-                                    "self": 20.836893393985747,
                                     "children": {
                                         "RLTrainer._checkpoint": {
-                                            "total": 0.3921068660001765,
-                                            "count": 4,
-                                            "self": 0.3921068660001765
                                         }
                                     }
                                 },
                                 "_update_policy": {
-                                    "total": 45.64960268299956,
-                                    "count": 45,
-                                    "self": 35.14298270399968,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
-                                            "total": 10.506619978999879,
-                                            "count": 540,
-                                            "self": 10.506619978999879
                                         }
                                     }
                                 }
@@ -340,19 +340,19 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 9.699999736767495e-07,
                     "count": 1,
-                    "self": 9.699999736767495e-07
                 },
                 "TrainerController._save_models": {
-                    "total": 0.08154246699996293,
                     "count": 1,
-                    "self": 0.0009384520001276542,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.08060401499983527,
                             "count": 1,
-                            "self": 0.08060401499983527
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 1.2791601419448853,
+            "min": 1.2791601419448853,
+            "max": 2.036785364151001,
+            "count": 30
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 14070.76171875,
+            "min": 11621.716796875,
+            "max": 20791.50390625,
+            "count": 30
         },
         "SnowballTarget.Step.mean": {
+            "value": 599936.0,
+            "min": 309920.0,
+            "max": 599936.0,
+            "count": 30
         },
         "SnowballTarget.Step.sum": {
+            "value": 599936.0,
+            "min": 309920.0,
+            "max": 599936.0,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 7.021315574645996,
+            "min": 4.909838676452637,
+            "max": 7.07533073425293,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 716.1741943359375,
+            "min": 451.7051696777344,
+            "max": 721.6837158203125,
+            "count": 30
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
+            "count": 30
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
             "value": 10945.0,
             "min": 8756.0,
             "max": 10945.0,
+            "count": 30
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 13.363636363636363,
+            "min": 9.886363636363637,
+            "max": 14.127659574468085,
+            "count": 30
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 735.0,
+            "min": 435.0,
+            "max": 747.0,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 13.363636363636363,
+            "min": 9.886363636363637,
+            "max": 14.127659574468085,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 735.0,
+            "min": 435.0,
+            "max": 747.0,
+            "count": 30
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.01730723716658152,
+            "min": 0.013768826169931952,
+            "max": 0.034235001677492015,
+            "count": 30
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.05192171149974456,
+            "min": 0.027537652339863904,
+            "max": 0.07840476820213856,
+            "count": 30
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.30628854119115406,
+            "min": 0.2808823101222515,
+            "max": 0.36244359364112216,
+            "count": 30
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.9188656235734622,
+            "min": 0.561764620244503,
+            "max": 0.9833823864658673,
+            "count": 30
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 7.654325679999995e-07,
+            "min": 7.654325679999995e-07,
+            "max": 4.879871786800001e-05,
+            "count": 30
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 2.2962977039999984e-06,
+            "min": 2.2962977039999984e-06,
+            "max": 0.000127696172304,
+            "count": 30
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10076533333333333,
+            "min": 0.10076533333333333,
+            "max": 0.1487986666666667,
+            "count": 30
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.302296,
+            "min": 0.20519733333333337,
+            "max": 0.4276960000000001,
+            "count": 30
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 1.375013333333333e-05,
+            "min": 1.375013333333333e-05,
+            "max": 0.0002491134666666667,
+            "count": 30
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 4.1250399999999994e-05,
+            "min": 4.1250399999999994e-05,
+            "max": 0.0006557103999999999,
+            "count": 30
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 30
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 30
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1762516960",
         "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --resume",
         "mlagents_version": "1.2.0.dev0",
         "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "2.8.0+cu128",
         "numpy_version": "1.23.5",
+        "end_time_seconds": "1762517552"
     },
+    "total": 592.2312760890004,
     "count": 1,
+    "self": 0.6854531370013319,
     "children": {
         "run_training.setup": {
+            "total": 0.025205188999734673,
             "count": 1,
+            "self": 0.025205188999734673
         },
         "TrainerController.start_learning": {
+            "total": 591.5206177629993,
             "count": 1,
+            "self": 0.634241693968761,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 1.8806869069999266,
                     "count": 1,
+                    "self": 1.8806869069999266
                 },
                 "TrainerController.advance": {
+                    "total": 588.891397155031,
+                    "count": 27328,
+                    "self": 0.6099100390879357,
                     "children": {
                         "env_step": {
+                            "total": 484.2565340659221,
+                            "count": 27328,
+                            "self": 378.1459005417764,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 105.73474780199558,
+                                    "count": 27328,
+                                    "self": 1.931934716001706,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 103.80281308599388,
+                                            "count": 27328,
+                                            "self": 103.80281308599388
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.37588572215008753,
+                                    "count": 27328,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 588.6466735419563,
+                                            "count": 27328,
                                             "is_parallel": true,
+                                            "self": 257.60993185196867,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.0025357979998261726,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0007605889991282311,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0017752090006979415,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0017752090006979415
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.036977805999867996,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0005932839994784445,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.0003188280002177635,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0003188280002177635
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.03413033800006815,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.03413033800006815
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0019353560001036385,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0003527700005179213,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0015825859995857172,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0015825859995857172
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 331.0367416899876,
+                                                    "count": 27327,
                                                     "is_parallel": true,
+                                                    "self": 15.200489163059956,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 8.095992872050374,
+                                                            "count": 27327,
                                                             "is_parallel": true,
+                                                            "self": 8.095992872050374
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 252.92622028195092,
+                                                            "count": 27327,
                                                             "is_parallel": true,
+                                                            "self": 252.92622028195092
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 54.814039372926345,
+                                                            "count": 27327,
                                                             "is_parallel": true,
+                                                            "self": 10.048774410947317,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 44.76526496197903,
+                                                                    "count": 273270,
                                                                     "is_parallel": true,
+                                                                    "self": 44.76526496197903
                                                                 }
                                                             }
                                                         }
                             }
                         },
                         "trainer_advance": {
+                            "total": 104.02495305002094,
+                            "count": 27328,
+                            "self": 0.8198006880729736,
                             "children": {
                                 "process_trajectory": {
+                                    "total": 31.862228450949715,
+                                    "count": 27328,
+                                    "self": 31.236804354948617,
                                     "children": {
                                         "RLTrainer._checkpoint": {
+                                            "total": 0.6254240960010975,
+                                            "count": 6,
+                                            "self": 0.6254240960010975
                                         }
                                     }
                                 },
                                 "_update_policy": {
+                                    "total": 71.34292391099825,
+                                    "count": 68,
+                                    "self": 54.793426481001916,
                                     "children": {
                                         "TorchPPOOptimizer.update": {
+                                            "total": 16.549497429996336,
+                                            "count": 816,
+                                            "self": 16.549497429996336
                                         }
                                     }
                                 }
                     }
                 },
                 "trainer_threads": {
+                    "total": 1.139000232797116e-06,
                     "count": 1,
+                    "self": 1.139000232797116e-06
                 },
                 "TrainerController._save_models": {
+                    "total": 0.11429086799944344,
                     "count": 1,
+                    "self": 0.0016393489995607524,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.11265151899988268,
                             "count": 1,
+                            "self": 0.11265151899988268
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -2,58 +2,76 @@
     "SnowballTarget": {
         "checkpoints": [
             {
-                "steps": 49952,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49952.onnx",
-                "reward": 3.5,
-                "creation_time": 1762514722.099842,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49952.pt"
                 ]
             },
             {
-                "steps": 99896,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99896.onnx",
-                "reward": 7.090909090909091,
-                "creation_time": 1762514819.0264485,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99896.pt"
                 ]
             },
             {
-                "steps": 149984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
                 "reward": null,
-                "creation_time": 1762514917.1551106,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             },
             {
-                "steps": 199984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 9.125,
-                "creation_time": 1762515009.988979,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             },
             {
-                "steps": 200200,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200200.onnx",
-                "reward": 10.545454545454545,
-                "creation_time": 1762515010.0893934,
                 "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200200.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 200200,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 10.545454545454545,
-            "creation_time": 1762515010.0893934,
             "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200200.pt"
             ]
         }
     },

     "SnowballTarget": {
         "checkpoints": [
             {
+                "steps": 349904,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-349904.onnx",
+                "reward": null,
+                "creation_time": 1762517059.2028866,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-349904.pt"
+                ]
+            },
+            {
+                "steps": 399992,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-399992.onnx",
+                "reward": 12.363636363636363,
+                "creation_time": 1762517157.627532,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-399992.pt"
                 ]
             },
             {
+                "steps": 449992,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-449992.onnx",
+                "reward": 13.263157894736842,
+                "creation_time": 1762517255.1124034,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-449992.pt"
                 ]
             },
             {
+                "steps": 499888,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-499888.onnx",
                 "reward": null,
+                "creation_time": 1762517354.1441364,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-499888.pt"
                 ]
             },
             {
+                "steps": 549976,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-549976.onnx",
+                "reward": 15.090909090909092,
+                "creation_time": 1762517451.8545153,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-549976.pt"
                 ]
             },
             {
+                "steps": 599936,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-599936.onnx",
+                "reward": null,
+                "creation_time": 1762517551.917334,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-599936.pt"
+                ]
+            },
+            {
+                "steps": 601216,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-601216.onnx",
+                "reward": null,
+                "creation_time": 1762517552.311762,
                 "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-601216.pt"
                 ]
             }
         ],
         "final_checkpoint": {
+            "steps": 601216,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": null,
+            "creation_time": 1762517552.311762,
             "auxillary_file_paths": [
+                "results/SnowballTarget1/SnowballTarget/SnowballTarget-601216.pt"
             ]
         }
     },