Tyraex commited on
Commit
be590ed
·
verified ·
1 Parent(s): ad1fedd

Updated model

Browse files
Files changed (41) hide show
  1. .gitattributes +6 -0
  2. SnowballTarget.onnx +2 -2
  3. SnowballTarget/SnowballTarget-149984.onnx +3 -0
  4. SnowballTarget/SnowballTarget-149984.onnx.data +3 -0
  5. SnowballTarget/SnowballTarget-149984.pt +3 -0
  6. SnowballTarget/SnowballTarget-199984.onnx +2 -2
  7. SnowballTarget/SnowballTarget-199984.onnx.data +2 -2
  8. SnowballTarget/SnowballTarget-199984.pt +2 -2
  9. SnowballTarget/SnowballTarget-249944.onnx +3 -0
  10. SnowballTarget/SnowballTarget-249944.onnx.data +3 -0
  11. SnowballTarget/SnowballTarget-249944.pt +3 -0
  12. SnowballTarget/SnowballTarget-26400.onnx +3 -0
  13. SnowballTarget/SnowballTarget-26400.onnx.data +3 -0
  14. SnowballTarget/SnowballTarget-26400.pt +3 -0
  15. SnowballTarget/SnowballTarget-299968.onnx +3 -0
  16. SnowballTarget/SnowballTarget-299968.onnx.data +3 -0
  17. SnowballTarget/SnowballTarget-299968.pt +3 -0
  18. SnowballTarget/SnowballTarget-319192.onnx +3 -0
  19. SnowballTarget/SnowballTarget-319192.onnx.data +3 -0
  20. SnowballTarget/SnowballTarget-319192.pt +3 -0
  21. SnowballTarget/SnowballTarget-349992.onnx +3 -0
  22. SnowballTarget/SnowballTarget-349992.pt +3 -0
  23. SnowballTarget/SnowballTarget-399992.onnx +3 -0
  24. SnowballTarget/SnowballTarget-399992.pt +3 -0
  25. SnowballTarget/SnowballTarget-449952.onnx +3 -0
  26. SnowballTarget/SnowballTarget-449952.pt +3 -0
  27. SnowballTarget/SnowballTarget-49936.onnx.data +2 -2
  28. SnowballTarget/SnowballTarget-499976.onnx +3 -0
  29. SnowballTarget/SnowballTarget-499976.pt +3 -0
  30. SnowballTarget/SnowballTarget-500104.onnx +3 -0
  31. SnowballTarget/SnowballTarget-500104.pt +3 -0
  32. SnowballTarget/SnowballTarget-99960.onnx +3 -0
  33. SnowballTarget/SnowballTarget-99960.onnx.data +3 -0
  34. SnowballTarget/SnowballTarget-99960.pt +3 -0
  35. SnowballTarget/checkpoint.pt +2 -2
  36. SnowballTarget/events.out.tfevents.1760689715.auriga.367238.0 +3 -0
  37. config.json +1 -1
  38. configuration.yaml +7 -7
  39. run_logs/Player-0.log +34 -34
  40. run_logs/timers.json +179 -179
  41. run_logs/training_status.json +79 -34
.gitattributes CHANGED
@@ -38,3 +38,9 @@ SnowballTarget/SnowballTarget-199984.onnx.data filter=lfs diff=lfs merge=lfs -te
38
  SnowballTarget/SnowballTarget-200240.onnx.data filter=lfs diff=lfs merge=lfs -text
39
  SnowballTarget/SnowballTarget-49936.onnx.data filter=lfs diff=lfs merge=lfs -text
40
  SnowballTarget/SnowballTarget-99936.onnx.data filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
38
  SnowballTarget/SnowballTarget-200240.onnx.data filter=lfs diff=lfs merge=lfs -text
39
  SnowballTarget/SnowballTarget-49936.onnx.data filter=lfs diff=lfs merge=lfs -text
40
  SnowballTarget/SnowballTarget-99936.onnx.data filter=lfs diff=lfs merge=lfs -text
41
+ SnowballTarget/SnowballTarget-149984.onnx.data filter=lfs diff=lfs merge=lfs -text
42
+ SnowballTarget/SnowballTarget-249944.onnx.data filter=lfs diff=lfs merge=lfs -text
43
+ SnowballTarget/SnowballTarget-26400.onnx.data filter=lfs diff=lfs merge=lfs -text
44
+ SnowballTarget/SnowballTarget-299968.onnx.data filter=lfs diff=lfs merge=lfs -text
45
+ SnowballTarget/SnowballTarget-319192.onnx.data filter=lfs diff=lfs merge=lfs -text
46
+ SnowballTarget/SnowballTarget-99960.onnx.data filter=lfs diff=lfs merge=lfs -text
SnowballTarget.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d4701d0ef34d1fc7767a17507b3807fade4be66ac12399835e87f76d87fcb0e
3
- size 62838
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4589ed51e34f079a3906f3250f747a0624b8421b89ffd54b7dc3495e700af4a8
3
+ size 1815958
SnowballTarget/SnowballTarget-149984.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61248c4a37f5ba55729692bfd20b7052b75628c4c88eac578927fcd5d46725f3
3
+ size 1815958
SnowballTarget/SnowballTarget-149984.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f1f58a57041f581e0885fc989497e7b52f044f0d99a201de5e9c89f47282d7a
3
+ size 1806336
SnowballTarget/SnowballTarget-149984.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab4a02d0dfb39890c291cd11837064dab55bfff36867a1197156ccddfaffe824
3
+ size 10820443
SnowballTarget/SnowballTarget-199984.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb48a8c4bd479ec5ba5ac4c4a73d14a72d64adbfc38b74558cf9727e74003f39
3
- size 62838
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:282fec681271870cdac8fcda4a10d50112284bccbda99999c8a799ed873fc88c
3
+ size 1815958
SnowballTarget/SnowballTarget-199984.onnx.data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2308d3c3424c7319b4160450785ac60f43f8f50a00753b5e3afefd6cdc31576c
3
- size 641024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e1fbcc58a9fd2671b1ba8a693d374318b00e83dda6849d0aad12939de3b79db
3
+ size 1806336
SnowballTarget/SnowballTarget-199984.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fbb0e36564ff3cf5085f6bbcef1cefd8012f0eea2b72581a18d90759184f2f6
3
- size 3850564
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9494cb348101165f11224a6d212ee1944542fddfeb0304c8e92608341d38127a
3
+ size 10820443
SnowballTarget/SnowballTarget-249944.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:770e752ca6fa4a542064d82db732601b3d5b3e3b7bf93a8c75a637308a7ba89d
3
+ size 1815958
SnowballTarget/SnowballTarget-249944.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23a75160d7d88e5400b2326ea55287b1046cdb215f24a7923b8e23a846e15bfb
3
+ size 1806336
SnowballTarget/SnowballTarget-249944.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99184268379dd1ee0ca500027d144e351d2eba2a5e0d8d64b9df26bff0b9a578
3
+ size 10820443
SnowballTarget/SnowballTarget-26400.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65fee282d447c7cc4ef5e285e799b45cc8594295ef9267ad214bb688caabbba2
3
+ size 62831
SnowballTarget/SnowballTarget-26400.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59511bd2ce34e2becd9fdf8606f27114c3a3719aa961d7384067a6b0f5a314b7
3
+ size 641024
SnowballTarget/SnowballTarget-26400.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bea03e38a347e1775953e556c129ac6e605bf49ed73468926a99e7a5737816b9
3
+ size 3850487
SnowballTarget/SnowballTarget-299968.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d925d859fd3f96e44bd3b77be4f99e3183dfc6f42627ef77c87229e36764091
3
+ size 1815958
SnowballTarget/SnowballTarget-299968.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73be9c6ac05feecfa5c2b4602afe746f3ae364c386f123bf9f4a8eda86ad4d7
3
+ size 1806336
SnowballTarget/SnowballTarget-299968.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6ebbc0244210bbf28258b3fd77de7180e451e2f8e078dd2cfb8516f09f42747
3
+ size 10820443
SnowballTarget/SnowballTarget-319192.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9941ad257489f80a635efd535f6291ec7d25cb440a398327ff349e8ffb4dc4c
3
+ size 62840
SnowballTarget/SnowballTarget-319192.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c73be9c6ac05feecfa5c2b4602afe746f3ae364c386f123bf9f4a8eda86ad4d7
3
+ size 1806336
SnowballTarget/SnowballTarget-319192.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f043b902ee5efb4e2cd5378c9ea19cc6ab6464c9f1bb11129c331407dadde18
3
+ size 10820932
SnowballTarget/SnowballTarget-349992.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f771f58ae4d97774a39f5fd06394ee6893866c404ebe3f86f971928ae72e9b4a
3
+ size 1815958
SnowballTarget/SnowballTarget-349992.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3cf857587e3f68310126bc51c1a66a56b394bb57c5381ed3cc873cece97cf84
3
+ size 10820443
SnowballTarget/SnowballTarget-399992.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5fc58b11adcede2d1901c05598a412232e4e256a612cb11973ea76a5bc6e7d7
3
+ size 1815958
SnowballTarget/SnowballTarget-399992.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4b027b06539d83d6f9fef385d6e030a7d0fa43b53815c6c3a7399aba40b28ee
3
+ size 10820443
SnowballTarget/SnowballTarget-449952.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cb650b9862918261a3f89214ee9412e8a81fe83ec05838ce2b8d67c3685e3aa
3
+ size 1815958
SnowballTarget/SnowballTarget-449952.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1ed0befb6667374c6461fa84fa1bc0c0788de23945e3265beaf4e560876f0bc
3
+ size 10820443
SnowballTarget/SnowballTarget-49936.onnx.data CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12b522799ac33a2fd4cdee9ab17bfd816e955390099cffb9d2c9f461b18219e9
3
- size 641024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b258a09cf3a6d4ea79a6f25be2cb9d633e3a3b0bc6cbc6a0fbc83554cc095a
3
+ size 1806336
SnowballTarget/SnowballTarget-499976.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4589ed51e34f079a3906f3250f747a0624b8421b89ffd54b7dc3495e700af4a8
3
+ size 1815958
SnowballTarget/SnowballTarget-499976.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec9f4fda5a0f2d3c6f54bd7ee64b7c0e0b4797fdc982935b8322fa954951af03
3
+ size 10820443
SnowballTarget/SnowballTarget-500104.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4589ed51e34f079a3906f3250f747a0624b8421b89ffd54b7dc3495e700af4a8
3
+ size 1815958
SnowballTarget/SnowballTarget-500104.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d9eecd3f09126843e7b0e79945f8c584d8d5b46d535ef3b4f66ce9871d080e2
3
+ size 10820443
SnowballTarget/SnowballTarget-99960.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d44097963c8568eddc7035817102564e028051b4e69d3f8eced5e24ddd8ec4a2
3
+ size 1815958
SnowballTarget/SnowballTarget-99960.onnx.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f268044b2441f0b88dcd338bcd1f15ef40ba71a51a6f47540d66b71794e7020
3
+ size 1806336
SnowballTarget/SnowballTarget-99960.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94120a8366dcb8563432d9f183f145480dc6978220142f6b9c8fc988a9e88a46
3
+ size 10820368
SnowballTarget/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9143fc7ce327a04893636630412a2fdb6d033fcdd224455ad6d9d9385c51b934
3
- size 3849717
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff7676ef75c6780c845f1ecfc01942ee35225b343ae1ba1f74b70ed86f5b1cdc
3
+ size 10819618
SnowballTarget/events.out.tfevents.1760689715.auriga.367238.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41a3c62052f013ecb3bfb26b142bad92929b952b49f1008ee0b9256a35b5cbea
3
+ size 81505
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 512, "buffer_size": 32768, "learning_rate": 0.0001, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 500000, "time_horizon": 64, "summary_freq": 10000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -3,9 +3,9 @@ behaviors:
3
  SnowballTarget:
4
  trainer_type: ppo
5
  hyperparameters:
6
- batch_size: 128
7
- buffer_size: 2048
8
- learning_rate: 0.0003
9
  beta: 0.005
10
  epsilon: 0.2
11
  lambd: 0.95
@@ -17,7 +17,7 @@ behaviors:
17
  checkpoint_interval: 50000
18
  network_settings:
19
  normalize: false
20
- hidden_units: 256
21
  num_layers: 2
22
  vis_encode_type: simple
23
  memory: null
@@ -38,7 +38,7 @@ behaviors:
38
  init_path: null
39
  keep_checkpoints: 10
40
  even_checkpoints: false
41
- max_steps: 200000
42
  time_horizon: 64
43
  summary_freq: 10000
44
  threaded: false
@@ -69,8 +69,8 @@ checkpoint_settings:
69
  run_id: SnowballTarget1
70
  initialize_from: null
71
  load_model: false
72
- resume: true
73
- force: false
74
  train_model: false
75
  inference: false
76
  results_dir: results
 
3
  SnowballTarget:
4
  trainer_type: ppo
5
  hyperparameters:
6
+ batch_size: 512
7
+ buffer_size: 32768
8
+ learning_rate: 0.0001
9
  beta: 0.005
10
  epsilon: 0.2
11
  lambd: 0.95
 
17
  checkpoint_interval: 50000
18
  network_settings:
19
  normalize: false
20
+ hidden_units: 512
21
  num_layers: 2
22
  vis_encode_type: simple
23
  memory: null
 
38
  init_path: null
39
  keep_checkpoints: 10
40
  even_checkpoints: false
41
+ max_steps: 500000
42
  time_horizon: 64
43
  summary_freq: 10000
44
  threaded: false
 
69
  run_id: SnowballTarget1
70
  initialize_from: null
71
  load_model: false
72
+ resume: false
73
+ force: true
74
  train_model: false
75
  inference: false
76
  results_dir: results
run_logs/Player-0.log CHANGED
@@ -11,7 +11,7 @@ NullGfxDevice:
11
  Renderer: Null Device
12
  Vendor: Unity Technologies
13
  Begin MonoManager ReloadAssembly
14
- - Completed reload, in 0.093 seconds
15
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
17
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -22,7 +22,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
22
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
23
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
24
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
25
- UnloadTime: 1.104540 ms
26
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
27
  requesting resize 84 x 84
28
  Setting up 24 worker threads for Enlighten.
@@ -30,16 +30,11 @@ Memory Statistics:
30
  [ALLOC_TEMP_TLS] TLS Allocator
31
  StackAllocators :
32
  [ALLOC_TEMP_MAIN]
33
- Peak usage frame count: [8.0 KB-16.0 KB]: 4031 frames, [16.0 KB-32.0 KB]: 68 frames, [2.0 MB-4.0 MB]: 1 frames
34
  Initial Block Size 4.0 MB
35
  Current Block Size 4.0 MB
36
  Peak Allocated Bytes 2.0 MB
37
  Overflow Count 0
38
- [ALLOC_TEMP_Job.Worker 19]
39
- Initial Block Size 256.0 KB
40
- Current Block Size 256.0 KB
41
- Peak Allocated Bytes 3.6 KB
42
- Overflow Count 0
43
  [ALLOC_TEMP_Job.Worker 18]
44
  Initial Block Size 256.0 KB
45
  Current Block Size 256.0 KB
@@ -55,6 +50,11 @@ Memory Statistics:
55
  Current Block Size 256.0 KB
56
  Peak Allocated Bytes 3.6 KB
57
  Overflow Count 0
 
 
 
 
 
58
  [ALLOC_TEMP_Job.Worker 44]
59
  Initial Block Size 256.0 KB
60
  Current Block Size 256.0 KB
@@ -220,12 +220,12 @@ Memory Statistics:
220
  Current Block Size 256.0 KB
221
  Peak Allocated Bytes 3.6 KB
222
  Overflow Count 0
223
- [ALLOC_TEMP_Job.Worker 21]
224
  Initial Block Size 256.0 KB
225
  Current Block Size 256.0 KB
226
  Peak Allocated Bytes 3.6 KB
227
  Overflow Count 0
228
- [ALLOC_TEMP_Job.Worker 26]
229
  Initial Block Size 256.0 KB
230
  Current Block Size 256.0 KB
231
  Peak Allocated Bytes 3.6 KB
@@ -235,7 +235,7 @@ Memory Statistics:
235
  Current Block Size 256.0 KB
236
  Peak Allocated Bytes 3.6 KB
237
  Overflow Count 0
238
- [ALLOC_TEMP_Background Job.Worker 14]
239
  Initial Block Size 32.0 KB
240
  Current Block Size 32.0 KB
241
  Peak Allocated Bytes 0 B
@@ -250,11 +250,6 @@ Memory Statistics:
250
  Current Block Size 256.0 KB
251
  Peak Allocated Bytes 3.6 KB
252
  Overflow Count 0
253
- [ALLOC_TEMP_Background Job.Worker 9]
254
- Initial Block Size 32.0 KB
255
- Current Block Size 32.0 KB
256
- Peak Allocated Bytes 0 B
257
- Overflow Count 0
258
  [ALLOC_TEMP_Job.Worker 34]
259
  Initial Block Size 256.0 KB
260
  Current Block Size 256.0 KB
@@ -265,6 +260,11 @@ Memory Statistics:
265
  Current Block Size 256.0 KB
266
  Peak Allocated Bytes 3.6 KB
267
  Overflow Count 0
 
 
 
 
 
268
  [ALLOC_TEMP_Job.Worker 29]
269
  Initial Block Size 256.0 KB
270
  Current Block Size 256.0 KB
@@ -350,12 +350,17 @@ Memory Statistics:
350
  Current Block Size 256.0 KB
351
  Peak Allocated Bytes 3.6 KB
352
  Overflow Count 0
 
 
 
 
 
353
  [ALLOC_TEMP_Job.Worker 15]
354
  Initial Block Size 256.0 KB
355
  Current Block Size 256.0 KB
356
  Peak Allocated Bytes 3.6 KB
357
  Overflow Count 0
358
- [ALLOC_TEMP_Job.Worker 24]
359
  Initial Block Size 256.0 KB
360
  Current Block Size 256.0 KB
361
  Peak Allocated Bytes 3.6 KB
@@ -370,28 +375,23 @@ Memory Statistics:
370
  Current Block Size 256.0 KB
371
  Peak Allocated Bytes 3.6 KB
372
  Overflow Count 0
373
- [ALLOC_TEMP_Loading.AsyncRead]
374
- Initial Block Size 64.0 KB
375
- Current Block Size 64.0 KB
376
- Peak Allocated Bytes 282 B
377
- Overflow Count 0
378
  [ALLOC_DEFAULT] Dual Thread Allocator
379
- Peak main deferred allocation count 36
380
  [ALLOC_BUCKET]
381
  Large Block size 4.0 MB
382
  Used Block count 1
383
  Peak Allocated bytes 1.0 MB
384
  [ALLOC_DEFAULT_MAIN]
385
- Peak usage frame count: [4.0 MB-8.0 MB]: 4100 frames
386
  Requested Block Size 16.0 MB
387
  Peak Block count 1
388
- Peak Allocated memory 6.6 MB
389
  Peak Large allocation bytes 0 B
390
  [ALLOC_DEFAULT_THREAD]
391
- Peak usage frame count: [16.0 MB-32.0 MB]: 4100 frames
392
  Requested Block Size 16.0 MB
393
  Peak Block count 1
394
- Peak Allocated memory 17.5 MB
395
  Peak Large allocation bytes 16.0 MB
396
  [ALLOC_TEMP_JOB_1_FRAME]
397
  Initial Block Size 2.0 MB
@@ -420,13 +420,13 @@ Memory Statistics:
420
  Used Block count 1
421
  Peak Allocated bytes 1.0 MB
422
  [ALLOC_GFX_MAIN]
423
- Peak usage frame count: [32.0 KB-64.0 KB]: 3482 frames, [64.0 KB-128.0 KB]: 618 frames
424
  Requested Block Size 16.0 MB
425
  Peak Block count 1
426
- Peak Allocated memory 67.3 KB
427
  Peak Large allocation bytes 0 B
428
  [ALLOC_GFX_THREAD]
429
- Peak usage frame count: [32.0 KB-64.0 KB]: 4100 frames
430
  Requested Block Size 16.0 MB
431
  Peak Block count 1
432
  Peak Allocated memory 39.6 KB
@@ -438,13 +438,13 @@ Memory Statistics:
438
  Used Block count 1
439
  Peak Allocated bytes 1.0 MB
440
  [ALLOC_CACHEOBJECTS_MAIN]
441
- Peak usage frame count: [0.5 MB-1.0 MB]: 4100 frames
442
  Requested Block Size 4.0 MB
443
  Peak Block count 1
444
  Peak Allocated memory 0.6 MB
445
  Peak Large allocation bytes 0 B
446
  [ALLOC_CACHEOBJECTS_THREAD]
447
- Peak usage frame count: [0.5 MB-1.0 MB]: 4099 frames, [2.0 MB-4.0 MB]: 1 frames
448
  Requested Block Size 4.0 MB
449
  Peak Block count 1
450
  Peak Allocated memory 2.2 MB
@@ -456,13 +456,13 @@ Memory Statistics:
456
  Used Block count 1
457
  Peak Allocated bytes 1.0 MB
458
  [ALLOC_TYPETREE_MAIN]
459
- Peak usage frame count: [0-1.0 KB]: 4100 frames
460
  Requested Block Size 2.0 MB
461
  Peak Block count 1
462
  Peak Allocated memory 1.0 KB
463
  Peak Large allocation bytes 0 B
464
  [ALLOC_TYPETREE_THREAD]
465
- Peak usage frame count: [1.0 KB-2.0 KB]: 4100 frames
466
  Requested Block Size 2.0 MB
467
  Peak Block count 1
468
  Peak Allocated memory 1.7 KB
 
11
  Renderer: Null Device
12
  Vendor: Unity Technologies
13
  Begin MonoManager ReloadAssembly
14
+ - Completed reload, in 0.099 seconds
15
  ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
16
  ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
17
  ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
22
  WARNING: Shader Unsupported: 'Standard' - All subshaders removed
23
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
24
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
25
+ UnloadTime: 1.286488 ms
26
  ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
27
  requesting resize 84 x 84
28
  Setting up 24 worker threads for Enlighten.
 
30
  [ALLOC_TEMP_TLS] TLS Allocator
31
  StackAllocators :
32
  [ALLOC_TEMP_MAIN]
33
+ Peak usage frame count: [8.0 KB-16.0 KB]: 13412 frames, [16.0 KB-32.0 KB]: 227 frames, [2.0 MB-4.0 MB]: 1 frames
34
  Initial Block Size 4.0 MB
35
  Current Block Size 4.0 MB
36
  Peak Allocated Bytes 2.0 MB
37
  Overflow Count 0
 
 
 
 
 
38
  [ALLOC_TEMP_Job.Worker 18]
39
  Initial Block Size 256.0 KB
40
  Current Block Size 256.0 KB
 
50
  Current Block Size 256.0 KB
51
  Peak Allocated Bytes 3.6 KB
52
  Overflow Count 0
53
+ [ALLOC_TEMP_Loading.AsyncRead]
54
+ Initial Block Size 64.0 KB
55
+ Current Block Size 64.0 KB
56
+ Peak Allocated Bytes 282 B
57
+ Overflow Count 0
58
  [ALLOC_TEMP_Job.Worker 44]
59
  Initial Block Size 256.0 KB
60
  Current Block Size 256.0 KB
 
220
  Current Block Size 256.0 KB
221
  Peak Allocated Bytes 3.6 KB
222
  Overflow Count 0
223
+ [ALLOC_TEMP_Job.Worker 26]
224
  Initial Block Size 256.0 KB
225
  Current Block Size 256.0 KB
226
  Peak Allocated Bytes 3.6 KB
227
  Overflow Count 0
228
+ [ALLOC_TEMP_Job.Worker 21]
229
  Initial Block Size 256.0 KB
230
  Current Block Size 256.0 KB
231
  Peak Allocated Bytes 3.6 KB
 
235
  Current Block Size 256.0 KB
236
  Peak Allocated Bytes 3.6 KB
237
  Overflow Count 0
238
+ [ALLOC_TEMP_Background Job.Worker 9]
239
  Initial Block Size 32.0 KB
240
  Current Block Size 32.0 KB
241
  Peak Allocated Bytes 0 B
 
250
  Current Block Size 256.0 KB
251
  Peak Allocated Bytes 3.6 KB
252
  Overflow Count 0
 
 
 
 
 
253
  [ALLOC_TEMP_Job.Worker 34]
254
  Initial Block Size 256.0 KB
255
  Current Block Size 256.0 KB
 
260
  Current Block Size 256.0 KB
261
  Peak Allocated Bytes 3.6 KB
262
  Overflow Count 0
263
+ [ALLOC_TEMP_Background Job.Worker 14]
264
+ Initial Block Size 32.0 KB
265
+ Current Block Size 32.0 KB
266
+ Peak Allocated Bytes 0 B
267
+ Overflow Count 0
268
  [ALLOC_TEMP_Job.Worker 29]
269
  Initial Block Size 256.0 KB
270
  Current Block Size 256.0 KB
 
350
  Current Block Size 256.0 KB
351
  Peak Allocated Bytes 3.6 KB
352
  Overflow Count 0
353
+ [ALLOC_TEMP_Job.Worker 24]
354
+ Initial Block Size 256.0 KB
355
+ Current Block Size 256.0 KB
356
+ Peak Allocated Bytes 3.6 KB
357
+ Overflow Count 0
358
  [ALLOC_TEMP_Job.Worker 15]
359
  Initial Block Size 256.0 KB
360
  Current Block Size 256.0 KB
361
  Peak Allocated Bytes 3.6 KB
362
  Overflow Count 0
363
+ [ALLOC_TEMP_Job.Worker 19]
364
  Initial Block Size 256.0 KB
365
  Current Block Size 256.0 KB
366
  Peak Allocated Bytes 3.6 KB
 
375
  Current Block Size 256.0 KB
376
  Peak Allocated Bytes 3.6 KB
377
  Overflow Count 0
 
 
 
 
 
378
  [ALLOC_DEFAULT] Dual Thread Allocator
379
+ Peak main deferred allocation count 44
380
  [ALLOC_BUCKET]
381
  Large Block size 4.0 MB
382
  Used Block count 1
383
  Peak Allocated bytes 1.0 MB
384
  [ALLOC_DEFAULT_MAIN]
385
+ Peak usage frame count: [4.0 MB-8.0 MB]: 9983 frames, [8.0 MB-16.0 MB]: 3657 frames
386
  Requested Block Size 16.0 MB
387
  Peak Block count 1
388
+ Peak Allocated memory 9.9 MB
389
  Peak Large allocation bytes 0 B
390
  [ALLOC_DEFAULT_THREAD]
391
+ Peak usage frame count: [16.0 MB-32.0 MB]: 13640 frames
392
  Requested Block Size 16.0 MB
393
  Peak Block count 1
394
+ Peak Allocated memory 17.4 MB
395
  Peak Large allocation bytes 16.0 MB
396
  [ALLOC_TEMP_JOB_1_FRAME]
397
  Initial Block Size 2.0 MB
 
420
  Used Block count 1
421
  Peak Allocated bytes 1.0 MB
422
  [ALLOC_GFX_MAIN]
423
+ Peak usage frame count: [32.0 KB-64.0 KB]: 10849 frames, [64.0 KB-128.0 KB]: 2791 frames
424
  Requested Block Size 16.0 MB
425
  Peak Block count 1
426
+ Peak Allocated memory 67.2 KB
427
  Peak Large allocation bytes 0 B
428
  [ALLOC_GFX_THREAD]
429
+ Peak usage frame count: [32.0 KB-64.0 KB]: 13640 frames
430
  Requested Block Size 16.0 MB
431
  Peak Block count 1
432
  Peak Allocated memory 39.6 KB
 
438
  Used Block count 1
439
  Peak Allocated bytes 1.0 MB
440
  [ALLOC_CACHEOBJECTS_MAIN]
441
+ Peak usage frame count: [0.5 MB-1.0 MB]: 13640 frames
442
  Requested Block Size 4.0 MB
443
  Peak Block count 1
444
  Peak Allocated memory 0.6 MB
445
  Peak Large allocation bytes 0 B
446
  [ALLOC_CACHEOBJECTS_THREAD]
447
+ Peak usage frame count: [0.5 MB-1.0 MB]: 13639 frames, [2.0 MB-4.0 MB]: 1 frames
448
  Requested Block Size 4.0 MB
449
  Peak Block count 1
450
  Peak Allocated memory 2.2 MB
 
456
  Used Block count 1
457
  Peak Allocated bytes 1.0 MB
458
  [ALLOC_TYPETREE_MAIN]
459
+ Peak usage frame count: [0-1.0 KB]: 13640 frames
460
  Requested Block Size 2.0 MB
461
  Peak Block count 1
462
  Peak Allocated memory 1.0 KB
463
  Peak Large allocation bytes 0 B
464
  [ALLOC_TYPETREE_THREAD]
465
+ Peak usage frame count: [1.0 KB-2.0 KB]: 13640 frames
466
  Requested Block Size 2.0 MB
467
  Peak Block count 1
468
  Peak Allocated memory 1.7 KB
run_logs/timers.json CHANGED
@@ -2,213 +2,213 @@
2
  "name": "root",
3
  "gauges": {
4
  "SnowballTarget.Policy.Entropy.mean": {
5
- "value": 0.9344794154167175,
6
- "min": 0.9344794154167175,
7
- "max": 2.153480291366577,
8
- "count": 16
9
  },
10
  "SnowballTarget.Policy.Entropy.sum": {
11
- "value": 8963.5263671875,
12
- "min": 1516.0501708984375,
13
- "max": 19536.798828125,
14
- "count": 16
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
  },
16
  "SnowballTarget.IsTraining.mean": {
17
  "value": 1.0,
18
  "min": 1.0,
19
  "max": 1.0,
20
- "count": 16
21
  },
22
  "SnowballTarget.IsTraining.sum": {
23
  "value": 1.0,
24
  "min": 1.0,
25
  "max": 1.0,
26
- "count": 16
27
- },
28
- "SnowballTarget.Step.mean": {
29
- "value": 199984.0,
30
- "min": 59952.0,
31
- "max": 199984.0,
32
- "count": 15
33
- },
34
- "SnowballTarget.Step.sum": {
35
- "value": 199984.0,
36
- "min": 59952.0,
37
- "max": 199984.0,
38
- "count": 15
39
- },
40
- "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
41
- "value": 12.326292037963867,
42
- "min": 5.530655384063721,
43
- "max": 12.326292037963867,
44
- "count": 15
45
- },
46
- "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
47
- "value": 2526.889892578125,
48
- "min": 1078.477783203125,
49
- "max": 2526.889892578125,
50
- "count": 15
51
  },
52
  "SnowballTarget.Losses.PolicyLoss.mean": {
53
- "value": 0.07485539761837573,
54
- "min": 0.0676656143312036,
55
- "max": 0.07485539761837573,
56
  "count": 15
57
  },
58
  "SnowballTarget.Losses.PolicyLoss.sum": {
59
- "value": 0.37427698809187865,
60
- "min": 0.2706624573248144,
61
- "max": 0.37427698809187865,
62
  "count": 15
63
  },
64
  "SnowballTarget.Losses.ValueLoss.mean": {
65
- "value": 0.176937632058181,
66
- "min": 0.176937632058181,
67
- "max": 0.2733584906969804,
68
  "count": 15
69
  },
70
  "SnowballTarget.Losses.ValueLoss.sum": {
71
- "value": 0.884688160290905,
72
- "min": 0.7650682372497578,
73
- "max": 1.3637838930475945,
74
  "count": 15
75
  },
76
  "SnowballTarget.Policy.LearningRate.mean": {
77
- "value": 7.428097524e-06,
78
- "min": 7.428097524e-06,
79
- "max": 0.000216978027674,
80
  "count": 15
81
  },
82
  "SnowballTarget.Policy.LearningRate.sum": {
83
- "value": 3.714048762e-05,
84
- "min": 3.714048762e-05,
85
- "max": 0.00101064016312,
86
  "count": 15
87
  },
88
  "SnowballTarget.Policy.Epsilon.mean": {
89
- "value": 0.10247600000000001,
90
- "min": 0.10247600000000001,
91
- "max": 0.172326,
92
  "count": 15
93
  },
94
  "SnowballTarget.Policy.Epsilon.sum": {
95
- "value": 0.5123800000000001,
96
- "min": 0.429704,
97
- "max": 0.8368800000000001,
98
  "count": 15
99
  },
100
  "SnowballTarget.Policy.Beta.mean": {
101
- "value": 0.00013355240000000005,
102
- "min": 0.00013355240000000005,
103
- "max": 0.0036190674000000003,
104
  "count": 15
105
  },
106
  "SnowballTarget.Policy.Beta.sum": {
107
- "value": 0.0006677620000000002,
108
- "min": 0.0006677620000000002,
109
- "max": 0.016860312000000002,
110
- "count": 15
111
- },
112
- "SnowballTarget.Environment.EpisodeLength.mean": {
113
- "value": 199.0,
114
- "min": 199.0,
115
- "max": 199.0,
116
- "count": 15
117
- },
118
- "SnowballTarget.Environment.EpisodeLength.sum": {
119
- "value": 10945.0,
120
- "min": 8756.0,
121
- "max": 10945.0,
122
- "count": 15
123
- },
124
- "SnowballTarget.Environment.CumulativeReward.mean": {
125
- "value": 24.30909090909091,
126
- "min": 14.772727272727273,
127
- "max": 24.30909090909091,
128
- "count": 15
129
- },
130
- "SnowballTarget.Environment.CumulativeReward.sum": {
131
- "value": 1337.0,
132
- "min": 650.0,
133
- "max": 1337.0,
134
- "count": 15
135
- },
136
- "SnowballTarget.Policy.ExtrinsicReward.mean": {
137
- "value": 24.30909090909091,
138
- "min": 14.772727272727273,
139
- "max": 24.30909090909091,
140
- "count": 15
141
- },
142
- "SnowballTarget.Policy.ExtrinsicReward.sum": {
143
- "value": 1337.0,
144
- "min": 650.0,
145
- "max": 1337.0,
146
  "count": 15
147
  }
148
  },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
- "start_time_seconds": "1760687063",
152
  "python_version": "3.10.12 (main, Aug 15 2025, 14:32:43) [GCC 11.4.0]",
153
- "command_line_arguments": "/local_scratch/ahmohame/MyRLProj/.venv/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --resume",
154
  "mlagents_version": "1.2.0.dev0",
155
  "mlagents_envs_version": "1.2.0.dev0",
156
  "communication_protocol_version": "1.5.0",
157
- "pytorch_version": "2.9.0+cu128",
158
  "numpy_version": "1.23.5",
159
- "end_time_seconds": "1760687495"
160
  },
161
- "total": 432.1884180130437,
162
  "count": 1,
163
- "self": 0.37457607907708734,
164
  "children": {
165
  "run_training.setup": {
166
- "total": 0.026659096009097993,
167
  "count": 1,
168
- "self": 0.026659096009097993
169
  },
170
  "TrainerController.start_learning": {
171
- "total": 431.7871828379575,
172
  "count": 1,
173
- "self": 0.19716291455551982,
174
  "children": {
175
  "TrainerController._reset_env": {
176
- "total": 2.315003640949726,
177
  "count": 1,
178
- "self": 2.315003640949726
179
  },
180
  "TrainerController.advance": {
181
- "total": 427.82484198745806,
182
- "count": 13664,
183
- "self": 0.20069539861287922,
184
  "children": {
185
  "env_step": {
186
- "total": 310.37624442589004,
187
- "count": 13664,
188
- "self": 271.7278343383223,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
- "total": 38.51920480164699,
192
- "count": 13664,
193
- "self": 0.6734598745824769,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
- "total": 37.845744927064516,
197
- "count": 13664,
198
- "self": 37.845744927064516
199
  }
200
  }
201
  },
202
  "workers": {
203
- "total": 0.12920528592076153,
204
- "count": 13664,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
- "total": 428.1941619500285,
209
- "count": 13664,
210
  "is_parallel": true,
211
- "self": 178.94030459946953,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
@@ -217,48 +217,48 @@
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
- "total": 0.004295137012377381,
221
  "count": 1,
222
  "is_parallel": true,
223
- "self": 0.0011666940990835428,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
- "total": 0.0031284429132938385,
227
  "count": 10,
228
  "is_parallel": true,
229
- "self": 0.0031284429132938385
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
- "total": 0.04597055108752102,
235
  "count": 1,
236
  "is_parallel": true,
237
- "self": 0.0008726851083338261,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
- "total": 0.0006993829738348722,
241
  "count": 1,
242
  "is_parallel": true,
243
- "self": 0.0006993829738348722
244
  },
245
  "communicator.exchange": {
246
- "total": 0.04149426205549389,
247
  "count": 1,
248
  "is_parallel": true,
249
- "self": 0.04149426205549389
250
  },
251
  "steps_from_proto": {
252
- "total": 0.002904220949858427,
253
  "count": 1,
254
  "is_parallel": true,
255
- "self": 0.0005674530984833837,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
- "total": 0.0023367678513750434,
259
  "count": 10,
260
  "is_parallel": true,
261
- "self": 0.0023367678513750434
262
  }
263
  }
264
  }
@@ -267,34 +267,34 @@
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
- "total": 249.25385735055897,
271
- "count": 13663,
272
  "is_parallel": true,
273
- "self": 9.961991776013747,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
- "total": 6.230835664086044,
277
- "count": 13663,
278
  "is_parallel": true,
279
- "self": 6.230835664086044
280
  },
281
  "communicator.exchange": {
282
- "total": 201.06483742501587,
283
- "count": 13663,
284
  "is_parallel": true,
285
- "self": 201.06483742501587
286
  },
287
  "steps_from_proto": {
288
- "total": 31.996192485443316,
289
- "count": 13663,
290
  "is_parallel": true,
291
- "self": 6.077628318686038,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
- "total": 25.918564166757278,
295
- "count": 136630,
296
  "is_parallel": true,
297
- "self": 25.918564166757278
298
  }
299
  }
300
  }
@@ -307,31 +307,31 @@
307
  }
308
  },
309
  "trainer_advance": {
310
- "total": 117.24790216295514,
311
- "count": 13664,
312
- "self": 0.27291102579329163,
313
  "children": {
314
  "process_trajectory": {
315
- "total": 23.37360843643546,
316
- "count": 13664,
317
- "self": 15.879194783512503,
318
  "children": {
319
  "RLTrainer._checkpoint": {
320
- "total": 7.494413652922958,
321
- "count": 4,
322
- "self": 7.494413652922958
323
  }
324
  }
325
  },
326
  "_update_policy": {
327
- "total": 93.60138270072639,
328
- "count": 68,
329
- "self": 23.973814754164778,
330
  "children": {
331
  "TorchPPOOptimizer.update": {
332
- "total": 69.62756794656161,
333
- "count": 3465,
334
- "self": 69.62756794656161
335
  }
336
  }
337
  }
@@ -340,19 +340,19 @@
340
  }
341
  },
342
  "trainer_threads": {
343
- "total": 9.710201993584633e-07,
344
  "count": 1,
345
- "self": 9.710201993584633e-07
346
  },
347
  "TrainerController._save_models": {
348
- "total": 1.4501733239740133,
349
  "count": 1,
350
- "self": 0.0005577360279858112,
351
  "children": {
352
  "RLTrainer._checkpoint": {
353
- "total": 1.4496155879460275,
354
  "count": 1,
355
- "self": 1.4496155879460275
356
  }
357
  }
358
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "SnowballTarget.Policy.Entropy.mean": {
5
+ "value": 1.8568122386932373,
6
+ "min": 1.8568122386932373,
7
+ "max": 2.8903470039367676,
8
+ "count": 50
9
  },
10
  "SnowballTarget.Policy.Entropy.sum": {
11
+ "value": 17810.54296875,
12
+ "min": 17775.48046875,
13
+ "max": 29759.01171875,
14
+ "count": 50
15
+ },
16
+ "SnowballTarget.Step.mean": {
17
+ "value": 499976.0,
18
+ "min": 9952.0,
19
+ "max": 499976.0,
20
+ "count": 50
21
+ },
22
+ "SnowballTarget.Step.sum": {
23
+ "value": 499976.0,
24
+ "min": 9952.0,
25
+ "max": 499976.0,
26
+ "count": 50
27
+ },
28
+ "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
29
+ "value": 6.018762111663818,
30
+ "min": -0.017574388533830643,
31
+ "max": 6.018762111663818,
32
+ "count": 50
33
+ },
34
+ "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
35
+ "value": 1233.84619140625,
36
+ "min": -3.602749824523926,
37
+ "max": 1233.84619140625,
38
+ "count": 50
39
+ },
40
+ "SnowballTarget.Environment.EpisodeLength.mean": {
41
+ "value": 199.0,
42
+ "min": 199.0,
43
+ "max": 199.0,
44
+ "count": 50
45
+ },
46
+ "SnowballTarget.Environment.EpisodeLength.sum": {
47
+ "value": 10945.0,
48
+ "min": 8756.0,
49
+ "max": 10945.0,
50
+ "count": 50
51
+ },
52
+ "SnowballTarget.Environment.CumulativeReward.mean": {
53
+ "value": 17.672727272727272,
54
+ "min": 2.727272727272727,
55
+ "max": 18.181818181818183,
56
+ "count": 50
57
+ },
58
+ "SnowballTarget.Environment.CumulativeReward.sum": {
59
+ "value": 972.0,
60
+ "min": 120.0,
61
+ "max": 972.0,
62
+ "count": 50
63
+ },
64
+ "SnowballTarget.Policy.ExtrinsicReward.mean": {
65
+ "value": 17.672727272727272,
66
+ "min": 2.727272727272727,
67
+ "max": 18.181818181818183,
68
+ "count": 50
69
+ },
70
+ "SnowballTarget.Policy.ExtrinsicReward.sum": {
71
+ "value": 972.0,
72
+ "min": 120.0,
73
+ "max": 972.0,
74
+ "count": 50
75
  },
76
  "SnowballTarget.IsTraining.mean": {
77
  "value": 1.0,
78
  "min": 1.0,
79
  "max": 1.0,
80
+ "count": 50
81
  },
82
  "SnowballTarget.IsTraining.sum": {
83
  "value": 1.0,
84
  "min": 1.0,
85
  "max": 1.0,
86
+ "count": 50
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
  },
88
  "SnowballTarget.Losses.PolicyLoss.mean": {
89
+ "value": 0.035475623733418615,
90
+ "min": 0.03180414954922147,
91
+ "max": 0.03817954923768715,
92
  "count": 15
93
  },
94
  "SnowballTarget.Losses.PolicyLoss.sum": {
95
+ "value": 0.035475623733418615,
96
+ "min": 0.03180414954922147,
97
+ "max": 0.03817954923768715,
98
  "count": 15
99
  },
100
  "SnowballTarget.Losses.ValueLoss.mean": {
101
+ "value": 0.3183900256020327,
102
+ "min": 0.08703206747304648,
103
+ "max": 0.3183900256020327,
104
  "count": 15
105
  },
106
  "SnowballTarget.Losses.ValueLoss.sum": {
107
+ "value": 0.3183900256020327,
108
+ "min": 0.08703206747304648,
109
+ "max": 0.3183900256020327,
110
  "count": 15
111
  },
112
  "SnowballTarget.Policy.LearningRate.mean": {
113
+ "value": 1.0176989823999964e-06,
114
+ "min": 1.0176989823999964e-06,
115
+ "max": 9.341760658240001e-05,
116
  "count": 15
117
  },
118
  "SnowballTarget.Policy.LearningRate.sum": {
119
+ "value": 1.0176989823999964e-06,
120
+ "min": 1.0176989823999964e-06,
121
+ "max": 9.341760658240001e-05,
122
  "count": 15
123
  },
124
  "SnowballTarget.Policy.Epsilon.mean": {
125
+ "value": 0.10101760000000003,
126
+ "min": 0.10101760000000003,
127
+ "max": 0.19341760000000005,
128
  "count": 15
129
  },
130
  "SnowballTarget.Policy.Epsilon.sum": {
131
+ "value": 0.10101760000000003,
132
+ "min": 0.10101760000000003,
133
+ "max": 0.19341760000000005,
134
  "count": 15
135
  },
136
  "SnowballTarget.Policy.Beta.mean": {
137
+ "value": 6.077823999999984e-05,
138
+ "min": 6.077823999999984e-05,
139
+ "max": 0.004671538240000001,
140
  "count": 15
141
  },
142
  "SnowballTarget.Policy.Beta.sum": {
143
+ "value": 6.077823999999984e-05,
144
+ "min": 6.077823999999984e-05,
145
+ "max": 0.004671538240000001,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
146
  "count": 15
147
  }
148
  },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
+ "start_time_seconds": "1760689714",
152
  "python_version": "3.10.12 (main, Aug 15 2025, 14:32:43) [GCC 11.4.0]",
153
+ "command_line_arguments": "/local_scratch/ahmohame/MyRLProj/.venv/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --force",
154
  "mlagents_version": "1.2.0.dev0",
155
  "mlagents_envs_version": "1.2.0.dev0",
156
  "communication_protocol_version": "1.5.0",
157
+ "pytorch_version": "2.3.1+cu121",
158
  "numpy_version": "1.23.5",
159
+ "end_time_seconds": "1760690960"
160
  },
161
+ "total": 1246.1255109719932,
162
  "count": 1,
163
+ "self": 0.374010790954344,
164
  "children": {
165
  "run_training.setup": {
166
+ "total": 0.02128842705860734,
167
  "count": 1,
168
+ "self": 0.02128842705860734
169
  },
170
  "TrainerController.start_learning": {
171
+ "total": 1245.7302117539803,
172
  "count": 1,
173
+ "self": 0.6739412506576627,
174
  "children": {
175
  "TrainerController._reset_env": {
176
+ "total": 2.9158263229765,
177
  "count": 1,
178
+ "self": 2.9158263229765
179
  },
180
  "TrainerController.advance": {
181
+ "total": 1242.0460719174007,
182
+ "count": 45464,
183
+ "self": 0.6814981006318703,
184
  "children": {
185
  "env_step": {
186
+ "total": 1054.3282872018171,
187
+ "count": 45464,
188
+ "self": 919.0131197725423,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
+ "total": 134.8636818312807,
192
+ "count": 45464,
193
+ "self": 2.2304799418197945,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
+ "total": 132.6332018894609,
197
+ "count": 45464,
198
+ "self": 132.6332018894609
199
  }
200
  }
201
  },
202
  "workers": {
203
+ "total": 0.45148559799417853,
204
+ "count": 45464,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
+ "total": 1243.1112274315674,
209
+ "count": 45464,
210
  "is_parallel": true,
211
+ "self": 398.501711131772,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
 
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
+ "total": 0.00440782296936959,
221
  "count": 1,
222
  "is_parallel": true,
223
+ "self": 0.0011371220462024212,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
+ "total": 0.003270700923167169,
227
  "count": 10,
228
  "is_parallel": true,
229
+ "self": 0.003270700923167169
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
+ "total": 0.04261121794115752,
235
  "count": 1,
236
  "is_parallel": true,
237
+ "self": 0.0009077248396351933,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
+ "total": 0.0006594400620087981,
241
  "count": 1,
242
  "is_parallel": true,
243
+ "self": 0.0006594400620087981
244
  },
245
  "communicator.exchange": {
246
+ "total": 0.03817833599168807,
247
  "count": 1,
248
  "is_parallel": true,
249
+ "self": 0.03817833599168807
250
  },
251
  "steps_from_proto": {
252
+ "total": 0.0028657170478254557,
253
  "count": 1,
254
  "is_parallel": true,
255
+ "self": 0.0005921600386500359,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
+ "total": 0.00227355700917542,
259
  "count": 10,
260
  "is_parallel": true,
261
+ "self": 0.00227355700917542
262
  }
263
  }
264
  }
 
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
+ "total": 844.6095162997954,
271
+ "count": 45463,
272
  "is_parallel": true,
273
+ "self": 35.7958256395068,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
+ "total": 21.017438556067646,
277
+ "count": 45463,
278
  "is_parallel": true,
279
+ "self": 21.017438556067646
280
  },
281
  "communicator.exchange": {
282
+ "total": 676.2517781199422,
283
+ "count": 45463,
284
  "is_parallel": true,
285
+ "self": 676.2517781199422
286
  },
287
  "steps_from_proto": {
288
+ "total": 111.54447398427874,
289
+ "count": 45463,
290
  "is_parallel": true,
291
+ "self": 21.141052892548032,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
+ "total": 90.4034210917307,
295
+ "count": 454630,
296
  "is_parallel": true,
297
+ "self": 90.4034210917307
298
  }
299
  }
300
  }
 
307
  }
308
  },
309
  "trainer_advance": {
310
+ "total": 187.03628661495168,
311
+ "count": 45464,
312
+ "self": 0.7960933083668351,
313
  "children": {
314
  "process_trajectory": {
315
+ "total": 50.32543419068679,
316
+ "count": 45464,
317
+ "self": 49.403155541745946,
318
  "children": {
319
  "RLTrainer._checkpoint": {
320
+ "total": 0.9222786489408463,
321
+ "count": 10,
322
+ "self": 0.9222786489408463
323
  }
324
  }
325
  },
326
  "_update_policy": {
327
+ "total": 135.91475911589805,
328
+ "count": 15,
329
+ "self": 79.53988587856293,
330
  "children": {
331
  "TorchPPOOptimizer.update": {
332
+ "total": 56.37487323733512,
333
+ "count": 2880,
334
+ "self": 56.37487323733512
335
  }
336
  }
337
  }
 
340
  }
341
  },
342
  "trainer_threads": {
343
+ "total": 8.719507604837418e-07,
344
  "count": 1,
345
+ "self": 8.719507604837418e-07
346
  },
347
  "TrainerController._save_models": {
348
+ "total": 0.0943713909946382,
349
  "count": 1,
350
+ "self": 0.0012160909827798605,
351
  "children": {
352
  "RLTrainer._checkpoint": {
353
+ "total": 0.09315530001185834,
354
  "count": 1,
355
+ "self": 0.09315530001185834
356
  }
357
  }
358
  }
run_logs/training_status.json CHANGED
@@ -1,65 +1,110 @@
1
  {
2
- "metadata": {
3
- "stats_format_version": "0.3.0",
4
- "mlagents_version": "1.2.0.dev0",
5
- "torch_version": "2.9.0+cu128"
6
- },
7
  "SnowballTarget": {
8
  "checkpoints": [
9
  {
10
- "steps": 49936,
11
- "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
12
- "reward": null,
13
- "creation_time": 1760687071.1677175,
14
  "auxillary_file_paths": [
15
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
16
  ]
17
  },
18
  {
19
- "steps": 99936,
20
- "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99936.onnx",
21
- "reward": 19.90909090909091,
22
- "creation_time": 1760687214.6778388,
23
  "auxillary_file_paths": [
24
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-99936.pt"
25
  ]
26
  },
27
  {
28
- "steps": 149960,
29
- "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149960.onnx",
30
- "reward": 23.727272727272727,
31
- "creation_time": 1760687348.7690995,
32
  "auxillary_file_paths": [
33
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-149960.pt"
34
  ]
35
  },
36
  {
37
- "steps": 199984,
38
- "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
39
- "reward": 25.181818181818183,
40
- "creation_time": 1760687494.144507,
41
  "auxillary_file_paths": [
42
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
  ]
44
  },
45
  {
46
- "steps": 200240,
47
- "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200240.onnx",
48
- "reward": 25.181818181818183,
49
- "creation_time": 1760687495.6147425,
50
  "auxillary_file_paths": [
51
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-200240.pt"
 
 
 
 
 
 
 
 
 
52
  ]
53
  }
54
  ],
55
  "final_checkpoint": {
56
- "steps": 200240,
57
  "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
58
- "reward": 25.181818181818183,
59
- "creation_time": 1760687495.6147425,
60
  "auxillary_file_paths": [
61
- "results/SnowballTarget1/SnowballTarget/SnowballTarget-200240.pt"
62
  ]
63
  }
 
 
 
 
 
64
  }
65
  }
 
1
  {
 
 
 
 
 
2
  "SnowballTarget": {
3
  "checkpoints": [
4
  {
5
+ "steps": 99960,
6
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
7
+ "reward": 4.2727272727272725,
8
+ "creation_time": 1760689965.875995,
9
  "auxillary_file_paths": [
10
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
11
  ]
12
  },
13
  {
14
+ "steps": 149984,
15
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
16
+ "reward": 8.373737373737374,
17
+ "creation_time": 1760690084.296909,
18
  "auxillary_file_paths": [
19
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
20
  ]
21
  },
22
  {
23
+ "steps": 199984,
24
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
25
+ "reward": 10.363636363636363,
26
+ "creation_time": 1760690215.7909374,
27
  "auxillary_file_paths": [
28
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
29
  ]
30
  },
31
  {
32
+ "steps": 249944,
33
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-249944.onnx",
34
+ "reward": 12.494949494949495,
35
+ "creation_time": 1760690337.2152503,
36
  "auxillary_file_paths": [
37
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-249944.pt"
38
+ ]
39
+ },
40
+ {
41
+ "steps": 299968,
42
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-299968.onnx",
43
+ "reward": 13.272727272727273,
44
+ "creation_time": 1760690461.3641863,
45
+ "auxillary_file_paths": [
46
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-299968.pt"
47
+ ]
48
+ },
49
+ {
50
+ "steps": 349992,
51
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-349992.onnx",
52
+ "reward": 14.745454545454546,
53
+ "creation_time": 1760690583.665323,
54
+ "auxillary_file_paths": [
55
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-349992.pt"
56
+ ]
57
+ },
58
+ {
59
+ "steps": 399992,
60
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-399992.onnx",
61
+ "reward": 16.727272727272727,
62
+ "creation_time": 1760690704.0682063,
63
+ "auxillary_file_paths": [
64
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-399992.pt"
65
+ ]
66
+ },
67
+ {
68
+ "steps": 449952,
69
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-449952.onnx",
70
+ "reward": 17.263636363636362,
71
+ "creation_time": 1760690823.7661152,
72
+ "auxillary_file_paths": [
73
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-449952.pt"
74
  ]
75
  },
76
  {
77
+ "steps": 499976,
78
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-499976.onnx",
79
+ "reward": 18.272727272727273,
80
+ "creation_time": 1760690960.1838775,
81
  "auxillary_file_paths": [
82
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-499976.pt"
83
+ ]
84
+ },
85
+ {
86
+ "steps": 500104,
87
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-500104.onnx",
88
+ "reward": 18.272727272727273,
89
+ "creation_time": 1760690960.2877028,
90
+ "auxillary_file_paths": [
91
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-500104.pt"
92
  ]
93
  }
94
  ],
95
  "final_checkpoint": {
96
+ "steps": 500104,
97
  "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
98
+ "reward": 18.272727272727273,
99
+ "creation_time": 1760690960.2877028,
100
  "auxillary_file_paths": [
101
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-500104.pt"
102
  ]
103
  }
104
+ },
105
+ "metadata": {
106
+ "stats_format_version": "0.3.0",
107
+ "mlagents_version": "1.2.0.dev0",
108
+ "torch_version": "2.3.1+cu121"
109
  }
110
  }