LuckLin committed on Jan 5

Commit

4a1dd8e

verified ·

1 Parent(s): 73b6002

Upload ML-Agents results without video

Browse files

Files changed (18) hide show

README.md +8 -8
SnowballTarget.onnx +3 -0
SnowballTarget/SnowballTarget-149984.onnx +3 -0
SnowballTarget/SnowballTarget-149984.pt +3 -0
SnowballTarget/SnowballTarget-199984.onnx +3 -0
SnowballTarget/SnowballTarget-199984.pt +3 -0
SnowballTarget/SnowballTarget-200112.onnx +3 -0
SnowballTarget/SnowballTarget-200112.pt +3 -0
SnowballTarget/SnowballTarget-49936.onnx +3 -0
SnowballTarget/SnowballTarget-49936.pt +3 -0
SnowballTarget/SnowballTarget-99960.onnx +3 -0
SnowballTarget/SnowballTarget-99960.pt +3 -0
SnowballTarget/checkpoint.pt +3 -0
SnowballTarget/events.out.tfevents.1767604585.c4ec318824e8.5813.0 +3 -0
configuration.yaml +76 -0
run_logs/Player-0.log +262 -0
run_logs/timers.json +362 -0
run_logs/training_status.json +65 -0

README.md CHANGED Viewed

@@ -1,21 +1,21 @@
 ---
 tags:
 - ml-agents
-- deep-reinforcement-learning
 - reinforcement-learning
 - unity-ml-agents
 library_name: ml-agents
 ---
-# ML-Agents 训练展示：SnowballTarget
-这是使用 Unity ML-Agents 训练的 **SnowballTarget** 模型。
 ### 训练说明
-- **算法**: PPO
 - **运行 ID**: `SnowballTarget1`
-- **训练环境**: SnowballTarget
-### 如何使用
-你可以下载本项目中的 `results/SnowballTarget1` 文件夹，并将其放入 Unity 项目中进行推理。

 ---
 tags:
 - ml-agents
 - reinforcement-learning
 - unity-ml-agents
 library_name: ml-agents
 ---
+# ML-Agents: SnowballTarget 模型
+这是使用 Unity ML-Agents 训练的 **SnowballTarget** 智能体模型。
+### 包含文件
+* **SnowballTarget.onnx**: 训练好的神经网络模型文件，可直接导入 Unity。
+* **configuration.yaml**: 训练时使用的超参数配置。
+* **config.json**: 训练环境的相关元数据。
+* **run_logs**: 训练运行日志文件夹，包含 `Player-0.log`、`timers.json` 和 `training_status.json`；记录奖励值和 Loss 曲线的 TensorBoard 事件文件位于 `SnowballTarget/` 目录下。
 ### 训练说明
 - **运行 ID**: `SnowballTarget1`
+- **算法**: PPO

SnowballTarget.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:090a48a1d53280c47b9ce99138c1eaf448289c65de169b361af3382611c0d897
+size 646532

SnowballTarget/SnowballTarget-149984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f634e650be0773a195f7eca6b0a58ab757e6349a2c192216bde644fef6242988
+size 646532

SnowballTarget/SnowballTarget-149984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7e604aafec37fd85d2b7091a4acaa217451ae11e0164037730cb93a95cddec0
+size 3843968

SnowballTarget/SnowballTarget-199984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:090a48a1d53280c47b9ce99138c1eaf448289c65de169b361af3382611c0d897
+size 646532

SnowballTarget/SnowballTarget-199984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:41c0b493152ff792dd736301942c2867f153e838e3ba9b27456a60c5faf3e427
+size 3843968

SnowballTarget/SnowballTarget-200112.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:090a48a1d53280c47b9ce99138c1eaf448289c65de169b361af3382611c0d897
+size 646532

SnowballTarget/SnowballTarget-200112.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ec4a7328d2f2f21808df92b8a16482e67e022d0231bbb503e4c972086423a7f4
+size 3843968

SnowballTarget/SnowballTarget-49936.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b711f65ca109a1a67c8f4edea03722a85b389ff94e32ba5d3a3e161c9a88ecce
+size 646532

SnowballTarget/SnowballTarget-49936.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f2a4e70d6d332743f3b50e81ec01da6761e95076001a74ac5c966470e4bc4876
+size 3843968

SnowballTarget/SnowballTarget-99960.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5918d3bfcc7828d7d7674664824899d3588f26c58efdfcd0c636bc83473e1da
+size 646532

SnowballTarget/SnowballTarget-99960.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:da7b63021d5d516e3503d6111f73418c469317630e1f79f2c1942a96f6cb72f4
+size 3843968

SnowballTarget/checkpoint.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ec4a7328d2f2f21808df92b8a16482e67e022d0231bbb503e4c972086423a7f4
+size 3843968

SnowballTarget/events.out.tfevents.1767604585.c4ec318824e8.5813.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb17739aadd9a54c89e8c5ecc20d6055f3d5e9157eec8f5ade7a0dabe50d551e
+size 23242

configuration.yaml ADDED Viewed

	@@ -0,0 +1,76 @@

+default_settings: null
+behaviors:
+  SnowballTarget:
+    trainer_type: ppo
+    hyperparameters:
+      batch_size: 128
+      buffer_size: 2048
+      learning_rate: 0.0003
+      beta: 0.005
+      epsilon: 0.2
+      lambd: 0.95
+      num_epoch: 3
+      shared_critic: false
+      learning_rate_schedule: linear
+      beta_schedule: linear
+      epsilon_schedule: linear
+    network_settings:
+      normalize: false
+      hidden_units: 256
+      num_layers: 2
+      vis_encode_type: simple
+      memory: null
+      goal_conditioning_type: hyper
+      deterministic: false
+    reward_signals:
+      extrinsic:
+        gamma: 0.99
+        strength: 1.0
+        network_settings:
+          normalize: false
+          hidden_units: 128
+          num_layers: 2
+          vis_encode_type: simple
+          memory: null
+          goal_conditioning_type: hyper
+          deterministic: false
+    init_path: null
+    keep_checkpoints: 10
+    checkpoint_interval: 50000
+    max_steps: 200000
+    time_horizon: 64
+    summary_freq: 10000
+    threaded: false
+    self_play: null
+    behavioral_cloning: null
+env_settings:
+  env_path: training-envs-executables/linux/SnowballTarget/SnowballTarget
+  env_args: null
+  base_port: 5005
+  num_envs: 1
+  num_areas: 1
+  seed: -1
+  max_lifetime_restarts: 10
+  restarts_rate_limit_n: 1
+  restarts_rate_limit_period_s: 60
+engine_settings:
+  width: 84
+  height: 84
+  quality_level: 5
+  time_scale: 20
+  target_frame_rate: -1
+  capture_frame_rate: 60
+  no_graphics: true
+environment_parameters: null
+checkpoint_settings:
+  run_id: SnowballTarget1
+  initialize_from: null
+  load_model: false
+  resume: false
+  force: false
+  train_model: false
+  inference: false
+  results_dir: results
+torch_settings:
+  device: null
+debug: false

run_logs/Player-0.log ADDED Viewed

	@@ -0,0 +1,262 @@

+Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/Managed'
+Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
+Preloaded 'lib_burst_generated.so'
+Preloaded 'libgrpc_csharp_ext.x64.so'
+PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
+PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
+Unable to load player prefs
+Initialize engine version: 2021.3.14f1 (eee1884e7226)
+[Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
+Forcing GfxDevice: Null
+GfxDevice: creating device client; threaded=0; jobified=0
+NullGfxDevice:
+    Version:  NULL 1.0 [1.0]
+    Renderer: Null Device
+    Vendor:   Unity Technologies
+ALSA lib confmisc.c:855:(parse_card) cannot find card '0'
+ALSA lib conf.c:5178:(_snd_config_evaluate) function snd_func_card_inum returned error: No such file or directory
+ALSA lib confmisc.c:422:(snd_func_concat) error evaluating strings
+ALSA lib conf.c:5178:(_snd_config_evaluate) function snd_func_concat returned error: No such file or directory
+ALSA lib confmisc.c:1334:(snd_func_refer) error evaluating name
+ALSA lib conf.c:5178:(_snd_config_evaluate) function snd_func_refer returned error: No such file or directory
+ALSA lib conf.c:5701:(snd_config_expand) Evaluate error: No such file or directory
+ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
+FMOD failed to initialize the output device.: "Error initializing output device. " (60)
+Forced to initialize FMOD to to the device driver's system output rate 48000, this may impact performance and/or give inconsistent experiences compared to selected sample rate 48000
+ALSA lib confmisc.c:855:(parse_card) cannot find card '0'
+ALSA lib conf.c:5178:(_snd_config_evaluate) function snd_func_card_inum returned error: No such file or directory
+ALSA lib confmisc.c:422:(snd_func_concat) error evaluating strings
+ALSA lib conf.c:5178:(_snd_config_evaluate) function snd_func_concat returned error: No such file or directory
+ALSA lib confmisc.c:1334:(snd_func_refer) error evaluating name
+ALSA lib conf.c:5178:(_snd_config_evaluate) function snd_func_refer returned error: No such file or directory
+ALSA lib conf.c:5701:(snd_config_expand) Evaluate error: No such file or directory
+ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
+FMOD failed to initialize the output device.: "Error initializing output device. " (60)
+FMOD initialized on nosound output
+Begin MonoManager ReloadAssembly
+- Completed reload, in  0.083 seconds
+ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
+ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
+ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
+WARNING: Shader Unsupported: 'Standard' - All subshaders removed
+WARNING: Shader Did you use #pragma only_renderers and omit this platform?
+WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
+WARNING: Shader Unsupported: 'Standard' - All subshaders removed
+WARNING: Shader Did you use #pragma only_renderers and omit this platform?
+WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.634091 ms
+ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
+requesting resize 84 x 84
+Setting up 1 worker threads for Enlighten.
+Memory Statistics:
+[ALLOC_TEMP_TLS] TLS Allocator
+  StackAllocators :
+    [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5367 frames, [16.0 KB-32.0 KB]: 90 frames, [2.0 MB-4.0 MB]: 1 frames
+      Initial Block Size 4.0 MB
+      Current Block Size 4.0 MB
+      Peak Allocated Bytes 2.0 MB
+      Overflow Count 0
+    [ALLOC_TEMP_Loading.AsyncRead]
+      Initial Block Size 64.0 KB
+      Current Block Size 64.0 KB
+      Peak Allocated Bytes 198 B
+      Overflow Count 0
+    [ALLOC_TEMP_Loading.PreloadManager]
+      Initial Block Size 256.0 KB
+      Current Block Size 304.0 KB
+      Peak Allocated Bytes 228.9 KB
+      Overflow Count 4
+    [ALLOC_TEMP_Background Job.Worker 8]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 9]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Job.Worker 0]
+      Initial Block Size 256.0 KB
+      Current Block Size 256.0 KB
+      Peak Allocated Bytes 3.6 KB
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 10]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 14]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 6]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 12]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_EnlightenWorker]
+      Initial Block Size 64.0 KB
+      Current Block Size 64.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 15]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 1]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 2]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 7]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_AssetGarbageCollectorHelper]
+      Initial Block Size 64.0 KB
+      Current Block Size 64.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 5]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 13]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 11]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 3]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 0]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_Background Job.Worker 4]
+      Initial Block Size 32.0 KB
+      Current Block Size 32.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+    [ALLOC_TEMP_BatchDeleteObjects]
+      Initial Block Size 64.0 KB
+      Current Block Size 64.0 KB
+      Peak Allocated Bytes 0 B
+      Overflow Count 0
+[ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 45
+    [ALLOC_BUCKET]
+      Large Block size 4.0 MB
+      Used Block count 1
+      Peak Allocated bytes 1.0 MB
+    [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5458 frames
+      Requested Block Size 16.0 MB
+      Peak Block count 1
+      Peak Allocated memory 7.2 MB
+      Peak Large allocation bytes 0 B
+    [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5458 frames
+      Requested Block Size 16.0 MB
+      Peak Block count 1
+      Peak Allocated memory 17.3 MB
+      Peak Large allocation bytes 16.0 MB
+[ALLOC_TEMP_JOB_1_FRAME]
+  Initial Block Size 2.0 MB
+  Used Block Count 1
+  Overflow Count (too large) 0
+  Overflow Count (full) 0
+[ALLOC_TEMP_JOB_2_FRAMES]
+  Initial Block Size 2.0 MB
+  Used Block Count 1
+  Overflow Count (too large) 0
+  Overflow Count (full) 0
+[ALLOC_TEMP_JOB_4_FRAMES (JobTemp)]
+  Initial Block Size 2.0 MB
+  Used Block Count 2
+  Overflow Count (too large) 0
+  Overflow Count (full) 0
+[ALLOC_TEMP_JOB_ASYNC (Background)]
+  Initial Block Size 1.0 MB
+  Used Block Count 3
+  Overflow Count (too large) 0
+  Overflow Count (full) 0
+[ALLOC_GFX] Dual Thread Allocator
+  Peak main deferred allocation count 0
+    [ALLOC_BUCKET]
+      Large Block size 4.0 MB
+      Used Block count 1
+      Peak Allocated bytes 1.0 MB
+    [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 3467 frames, [64.0 KB-128.0 KB]: 1991 frames
+      Requested Block Size 16.0 MB
+      Peak Block count 1
+      Peak Allocated memory 68.6 KB
+      Peak Large allocation bytes 0 B
+    [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5458 frames
+      Requested Block Size 16.0 MB
+      Peak Block count 1
+      Peak Allocated memory 39.6 KB
+      Peak Large allocation bytes 0 B
+[ALLOC_CACHEOBJECTS] Dual Thread Allocator
+  Peak main deferred allocation count 0
+    [ALLOC_BUCKET]
+      Large Block size 4.0 MB
+      Used Block count 1
+      Peak Allocated bytes 1.0 MB
+    [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5458 frames
+      Requested Block Size 4.0 MB
+      Peak Block count 1
+      Peak Allocated memory 0.6 MB
+      Peak Large allocation bytes 0 B
+    [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5457 frames, [2.0 MB-4.0 MB]: 1 frames
+      Requested Block Size 4.0 MB
+      Peak Block count 1
+      Peak Allocated memory 2.2 MB
+      Peak Large allocation bytes 0 B
+[ALLOC_TYPETREE] Dual Thread Allocator
+  Peak main deferred allocation count 0
+    [ALLOC_BUCKET]
+      Large Block size 4.0 MB
+      Used Block count 1
+      Peak Allocated bytes 1.0 MB
+    [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5458 frames
+      Requested Block Size 2.0 MB
+      Peak Block count 1
+      Peak Allocated memory 1.0 KB
+      Peak Large allocation bytes 0 B
+    [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5458 frames
+      Requested Block Size 2.0 MB
+      Peak Block count 1
+      Peak Allocated memory 1.7 KB
+      Peak Large allocation bytes 0 B

run_logs/timers.json ADDED Viewed

	@@ -0,0 +1,362 @@

+{
+    "name": "root",
+    "gauges": {
+        "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.7129193544387817,
+            "min": 0.7129193544387817,
+            "max": 2.8399477005004883,
+            "count": 20
+        },
+        "SnowballTarget.Policy.Entropy.sum": {
+            "value": 6775.58544921875,
+            "min": 6775.58544921875,
+            "max": 28990.185546875,
+            "count": 20
+        },
+        "SnowballTarget.Step.mean": {
+            "value": 199984.0,
+            "min": 9952.0,
+            "max": 199984.0,
+            "count": 20
+        },
+        "SnowballTarget.Step.sum": {
+            "value": 199984.0,
+            "min": 9952.0,
+            "max": 199984.0,
+            "count": 20
+        },
+        "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 12.568286895751953,
+            "min": 0.6493656039237976,
+            "max": 12.568286895751953,
+            "count": 20
+        },
+        "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2450.81591796875,
+            "min": 125.9769287109375,
+            "max": 2512.68505859375,
+            "count": 20
+        },
+        "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.06376773407671363,
+            "min": 0.06303729918003156,
+            "max": 0.07480492593056304,
+            "count": 20
+        },
+        "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.2550709363068545,
+            "min": 0.25214919672012626,
+            "max": 0.3740246296528152,
+            "count": 20
+        },
+        "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.18687986184422878,
+            "min": 0.143810383259894,
+            "max": 0.2750409629707243,
+            "count": 20
+        },
+        "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.7475194473769151,
+            "min": 0.575241533039576,
+            "max": 1.2682422405364466,
+            "count": 20
+        },
+        "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 8.082097306000005e-06,
+            "min": 8.082097306000005e-06,
+            "max": 0.000291882002706,
+            "count": 20
+        },
+        "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 3.232838922400002e-05,
+            "min": 3.232838922400002e-05,
+            "max": 0.00138516003828,
+            "count": 20
+        },
+        "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10269400000000001,
+            "min": 0.10269400000000001,
+            "max": 0.19729400000000002,
+            "count": 20
+        },
+        "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.41077600000000003,
+            "min": 0.41077600000000003,
+            "max": 0.96172,
+            "count": 20
+        },
+        "SnowballTarget.Policy.Beta.mean": {
+            "value": 0.0001444306000000001,
+            "min": 0.0001444306000000001,
+            "max": 0.0048649706,
+            "count": 20
+        },
+        "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.0005777224000000004,
+            "min": 0.0005777224000000004,
+            "max": 0.023089828,
+            "count": 20
+        },
+        "SnowballTarget.Environment.EpisodeLength.mean": {
+            "value": 199.0,
+            "min": 199.0,
+            "max": 199.0,
+            "count": 20
+        },
+        "SnowballTarget.Environment.EpisodeLength.sum": {
+            "value": 8756.0,
+            "min": 8756.0,
+            "max": 10945.0,
+            "count": 20
+        },
+        "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 25.386363636363637,
+            "min": 4.0227272727272725,
+            "max": 25.386363636363637,
+            "count": 20
+        },
+        "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1117.0,
+            "min": 177.0,
+            "max": 1350.0,
+            "count": 20
+        },
+        "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 25.386363636363637,
+            "min": 4.0227272727272725,
+            "max": 25.386363636363637,
+            "count": 20
+        },
+        "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1117.0,
+            "min": 177.0,
+            "max": 1350.0,
+            "count": 20
+        },
+        "SnowballTarget.IsTraining.mean": {
+            "value": 1.0,
+            "min": 1.0,
+            "max": 1.0,
+            "count": 20
+        },
+        "SnowballTarget.IsTraining.sum": {
+            "value": 1.0,
+            "min": 1.0,
+            "max": 1.0,
+            "count": 20
+        }
+    },
+    "metadata": {
+        "timer_format_version": "0.1.0",
+        "start_time_seconds": "1767604584",
+        "python_version": "3.10.12 (main, Nov  4 2025, 08:48:33) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/lib/python3.10/dist-packages/mlagents/trainers/learn.py config/ppo/SnowballTarget.yaml --env=training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
+        "mlagents_version": "0.30.0",
+        "mlagents_envs_version": "0.30.0",
+        "communication_protocol_version": "1.5.0",
+        "pytorch_version": "1.11.0+cu102",
+        "numpy_version": "1.21.2",
+        "end_time_seconds": "1767605004"
+    },
+    "total": 420.0462367729999,
+    "count": 1,
+    "self": 0.4789151130000846,
+    "children": {
+        "run_training.setup": {
+            "total": 0.015575675000036426,
+            "count": 1,
+            "self": 0.015575675000036426
+        },
+        "TrainerController.start_learning": {
+            "total": 419.5517459849998,
+            "count": 1,
+            "self": 0.39738225599649013,
+            "children": {
+                "TrainerController._reset_env": {
+                    "total": 4.351109004999898,
+                    "count": 1,
+                    "self": 4.351109004999898
+                },
+                "TrainerController.advance": {
+                    "total": 414.6711300170034,
+                    "count": 18192,
+                    "self": 0.3892191160005041,
+                    "children": {
+                        "env_step": {
+                            "total": 302.8226869550017,
+                            "count": 18192,
+                            "self": 251.713234211011,
+                            "children": {
+                                "SubprocessEnvManager._take_step": {
+                                    "total": 50.87050107098935,
+                                    "count": 18192,
+                                    "self": 1.8175279629947454,
+                                    "children": {
+                                        "TorchPolicy.evaluate": {
+                                            "total": 49.0529731079946,
+                                            "count": 18192,
+                                            "self": 49.0529731079946
+                                        }
+                                    }
+                                },
+                                "workers": {
+                                    "total": 0.23895167300133835,
+                                    "count": 18192,
+                                    "self": 0.0,
+                                    "children": {
+                                        "worker_root": {
+                                            "total": 417.7713763080035,
+                                            "count": 18192,
+                                            "is_parallel": true,
+                                            "self": 196.42828577999057,
+                                            "children": {
+                                                "run_training.setup": {
+                                                    "total": 0.0,
+                                                    "count": 0,
+                                                    "is_parallel": true,
+                                                    "self": 0.0,
+                                                    "children": {
+                                                        "steps_from_proto": {
+                                                            "total": 0.0019955570001002343,
+                                                            "count": 1,
+                                                            "is_parallel": true,
+                                                            "self": 0.0006047110000508837,
+                                                            "children": {
+                                                                "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0013908460000493506,
+                                                                    "count": 10,
+                                                                    "is_parallel": true,
+                                                                    "self": 0.0013908460000493506
+                                                                }
+                                                            }
+                                                        },
+                                                        "UnityEnvironment.step": {
+                                                            "total": 0.051043671999877915,
+                                                            "count": 1,
+                                                            "is_parallel": true,
+                                                            "self": 0.000589509999826987,
+                                                            "children": {
+                                                                "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.00043392099996708566,
+                                                                    "count": 1,
+                                                                    "is_parallel": true,
+                                                                    "self": 0.00043392099996708566
+                                                                },
+                                                                "communicator.exchange": {
+                                                                    "total": 0.04799759200000153,
+                                                                    "count": 1,
+                                                                    "is_parallel": true,
+                                                                    "self": 0.04799759200000153
+                                                                },
+                                                                "steps_from_proto": {
+                                                                    "total": 0.0020226490000823105,
+                                                                    "count": 1,
+                                                                    "is_parallel": true,
+                                                                    "self": 0.0003916860000572342,
+                                                                    "children": {
+                                                                        "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0016309630000250763,
+                                                                            "count": 10,
+                                                                            "is_parallel": true,
+                                                                            "self": 0.0016309630000250763
+                                                                        }
+                                                                    }
+                                                                }
+                                                            }
+                                                        }
+                                                    }
+                                                },
+                                                "UnityEnvironment.step": {
+                                                    "total": 221.3430905280129,
+                                                    "count": 18191,
+                                                    "is_parallel": true,
+                                                    "self": 9.899855793025836,
+                                                    "children": {
+                                                        "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.500544546990795,
+                                                            "count": 18191,
+                                                            "is_parallel": true,
+                                                            "self": 5.500544546990795
+                                                        },
+                                                        "communicator.exchange": {
+                                                            "total": 166.24368432500364,
+                                                            "count": 18191,
+                                                            "is_parallel": true,
+                                                            "self": 166.24368432500364
+                                                        },
+                                                        "steps_from_proto": {
+                                                            "total": 39.699005862992635,
+                                                            "count": 18191,
+                                                            "is_parallel": true,
+                                                            "self": 7.0311746900054,
+                                                            "children": {
+                                                                "_process_rank_one_or_two_observation": {
+                                                                    "total": 32.667831172987235,
+                                                                    "count": 181910,
+                                                                    "is_parallel": true,
+                                                                    "self": 32.667831172987235
+                                                                }
+                                                            }
+                                                        }
+                                                    }
+                                                }
+                                            }
+                                        }
+                                    }
+                                }
+                            }
+                        },
+                        "trainer_advance": {
+                            "total": 111.4592239460012,
+                            "count": 18192,
+                            "self": 0.5030162169821324,
+                            "children": {
+                                "process_trajectory": {
+                                    "total": 22.219853412019347,
+                                    "count": 18192,
+                                    "self": 21.553372681019255,
+                                    "children": {
+                                        "RLTrainer._checkpoint": {
+                                            "total": 0.6664807310000924,
+                                            "count": 4,
+                                            "self": 0.6664807310000924
+                                        }
+                                    }
+                                },
+                                "_update_policy": {
+                                    "total": 88.73635431699972,
+                                    "count": 90,
+                                    "self": 47.1698457539876,
+                                    "children": {
+                                        "TorchPPOOptimizer.update": {
+                                            "total": 41.56650856301212,
+                                            "count": 4587,
+                                            "self": 41.56650856301212
+                                        }
+                                    }
+                                }
+                            }
+                        }
+                    }
+                },
+                "trainer_threads": {
+                    "total": 9.240000053978292e-07,
+                    "count": 1,
+                    "self": 9.240000053978292e-07
+                },
+                "TrainerController._save_models": {
+                    "total": 0.13212378299999727,
+                    "count": 1,
+                    "self": 0.0007380800000191812,
+                    "children": {
+                        "RLTrainer._checkpoint": {
+                            "total": 0.1313857029999781,
+                            "count": 1,
+                            "self": 0.1313857029999781
+                        }
+                    }
+                }
+            }
+        }
+    }
+}

run_logs/training_status.json ADDED Viewed

	@@ -0,0 +1,65 @@

+{
+    "SnowballTarget": {
+        "checkpoints": [
+            {
+                "steps": 49936,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
+                "reward": 16.90909090909091,
+                "creation_time": 1767604691.4502096,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
+                ]
+            },
+            {
+                "steps": 99960,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
+                "reward": 21.0,
+                "creation_time": 1767604795.3609436,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
+                ]
+            },
+            {
+                "steps": 149984,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 23.818181818181817,
+                "creation_time": 1767604900.563291,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
+                ]
+            },
+            {
+                "steps": 199984,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
+                "reward": 25.727272727272727,
+                "creation_time": 1767605004.323427,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
+                ]
+            },
+            {
+                "steps": 200112,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": 25.727272727272727,
+                "creation_time": 1767605004.4662263,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
+                ]
+            }
+        ],
+        "final_checkpoint": {
+            "steps": 200112,
+            "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 25.727272727272727,
+            "creation_time": 1767605004.4662263,
+            "auxillary_file_paths": [
+                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
+            ]
+        }
+    },
+    "metadata": {
+        "stats_format_version": "0.3.0",
+        "mlagents_version": "0.30.0",
+        "torch_version": "1.11.0+cu102"
+    }
+}