Huggy

Browse files

Files changed (5) hide show

README.md +22 -18
config.json +1 -1
configuration.yaml +7 -3
run_logs/timers.json +20 -342
run_logs/training_status.json +2 -114

README.md CHANGED Viewed

@@ -1,31 +1,35 @@
 ---
-      tags:
-      - unity-ml-agents
-      - ml-agents
-      - deep-reinforcement-learning
-      - reinforcement-learning
-      - ML-Agents-Huggy
-      library_name: ml-agents
 ---
   # **ppo** Agent playing **Huggy**
-  This is a trained model of a **ppo** agent playing **Huggy** using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
   ## Usage (with ML-Agents)
-  The Documentation: https://github.com/huggingface/ml-agents#get-started
-  We wrote a complete tutorial to learn to train your first agent using ML-Agents and publish it to the Hub:
   ### Resume the training
-  ```
   mlagents-learn <your_configuration_file_path.yaml> --run-id=<run_id> --resume
   ```
   ### Watch your Agent play
-  You can watch your agent **playing directly in your browser:**.
-  1. Go to https://huggingface.co/spaces/unity/ML-Agents-Huggy
-  2. Step 1: Write your model_id: azaazato/ppo-Huggy
   3. Step 2: Select your *.nn /*.onnx file
   4. Click on Watch the agent play 👀

 ---
+library_name: ml-agents
+tags:
+- Huggy
+- deep-reinforcement-learning
+- reinforcement-learning
+- ML-Agents-Huggy
 ---
   # **ppo** Agent playing **Huggy**
+  This is a trained model of a **ppo** agent playing **Huggy**
+  using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
   ## Usage (with ML-Agents)
+  The Documentation: https://unity-technologies.github.io/ml-agents/ML-Agents-Toolkit-Documentation/
+  We wrote a complete tutorial to learn to train your first agent using ML-Agents and publish it to the Hub:
+  - A *short tutorial* where you teach Huggy the Dog 🐶 to fetch the stick and then play with him directly in your
+  browser: https://huggingface.co/learn/deep-rl-course/unitbonus1/introduction
+  - A *longer tutorial* to understand how ML-Agents works:
+  https://huggingface.co/learn/deep-rl-course/unit5/introduction
   ### Resume the training
+  ```bash
   mlagents-learn <your_configuration_file_path.yaml> --run-id=<run_id> --resume
   ```
   ### Watch your Agent play
+  You can watch your agent **playing directly in your browser**:
+  1. If the environment is part of ML-Agents official environments, go to https://huggingface.co/unity
+  2. Step 1: Find your model_id: azaazato/ppo-Huggy
   3. Step 2: Select your *.nn /*.onnx file
   4. Click on Watch the agent play 👀

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"Huggy": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 15, "checkpoint_interval": 200000, "max_steps": 2000000, "time_horizon": 1000, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./trained-envs-executables/linux/Huggy/Huggy", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Huggy", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"Huggy": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 200000, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 15, "even_checkpoints": false, "max_steps": 2000000, "time_horizon": 1000, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./trained-envs-executables/linux/Huggy/Huggy", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Huggy2", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -10,9 +10,11 @@ behaviors:
       epsilon: 0.2
       lambd: 0.95
       num_epoch: 3
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
     network_settings:
       normalize: true
       hidden_units: 512
@@ -35,7 +37,7 @@ behaviors:
           deterministic: false
     init_path: null
     keep_checkpoints: 15
-    checkpoint_interval: 200000
     max_steps: 2000000
     time_horizon: 1000
     summary_freq: 50000
@@ -48,6 +50,7 @@ env_settings:
   base_port: 5005
   num_envs: 1
   num_areas: 1
   seed: -1
   max_lifetime_restarts: 10
   restarts_rate_limit_n: 1
@@ -60,13 +63,14 @@ engine_settings:
   target_frame_rate: -1
   capture_frame_rate: 60
   no_graphics: true
 environment_parameters: null
 checkpoint_settings:
-  run_id: Huggy
   initialize_from: null
   load_model: false
   resume: false
-  force: false
   train_model: false
   inference: false
   results_dir: results

       epsilon: 0.2
       lambd: 0.95
       num_epoch: 3
+      shared_critic: false
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
+    checkpoint_interval: 200000
     network_settings:
       normalize: true
       hidden_units: 512
           deterministic: false
     init_path: null
     keep_checkpoints: 15
+    even_checkpoints: false
     max_steps: 2000000
     time_horizon: 1000
     summary_freq: 50000
   base_port: 5005
   num_envs: 1
   num_areas: 1
+  timeout_wait: 60
   seed: -1
   max_lifetime_restarts: 10
   restarts_rate_limit_n: 1
   target_frame_rate: -1
   capture_frame_rate: 60
   no_graphics: true
+  no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
+  run_id: Huggy2
   initialize_from: null
   load_model: false
   resume: false
+  force: true
   train_model: false
   inference: false
   results_dir: results

run_logs/timers.json CHANGED Viewed

@@ -1,367 +1,45 @@
 {
     "name": "root",
-    "gauges": {
-        "Huggy.Policy.Entropy.mean": {
-            "value": 1.4060659408569336,
-            "min": 1.4060659408569336,
-            "max": 1.4315779209136963,
-            "count": 40
-        },
-        "Huggy.Policy.Entropy.sum": {
-            "value": 70076.921875,
-            "min": 68163.3125,
-            "max": 78823.0625,
-            "count": 40
-        },
-        "Huggy.Environment.EpisodeLength.mean": {
-            "value": 95.30057803468208,
-            "min": 84.09013605442176,
-            "max": 380.91603053435114,
-            "count": 40
-        },
-        "Huggy.Environment.EpisodeLength.sum": {
-            "value": 49461.0,
-            "min": 48870.0,
-            "max": 50034.0,
-            "count": 40
-        },
-        "Huggy.Step.mean": {
-            "value": 1999905.0,
-            "min": 49810.0,
-            "max": 1999905.0,
-            "count": 40
-        },
-        "Huggy.Step.sum": {
-            "value": 1999905.0,
-            "min": 49810.0,
-            "max": 1999905.0,
-            "count": 40
-        },
-        "Huggy.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 2.411778450012207,
-            "min": 0.06771308928728104,
-            "max": 2.4655308723449707,
-            "count": 40
-        },
-        "Huggy.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 1251.7130126953125,
-            "min": 8.802701950073242,
-            "max": 1396.031005859375,
-            "count": 40
-        },
-        "Huggy.Environment.CumulativeReward.mean": {
-            "value": 3.7844826048509232,
-            "min": 1.8963831330721195,
-            "max": 3.932653166745838,
-            "count": 40
-        },
-        "Huggy.Environment.CumulativeReward.sum": {
-            "value": 1964.1464719176292,
-            "min": 246.52980729937553,
-            "max": 2218.038535296917,
-            "count": 40
-        },
-        "Huggy.Policy.ExtrinsicReward.mean": {
-            "value": 3.7844826048509232,
-            "min": 1.8963831330721195,
-            "max": 3.932653166745838,
-            "count": 40
-        },
-        "Huggy.Policy.ExtrinsicReward.sum": {
-            "value": 1964.1464719176292,
-            "min": 246.52980729937553,
-            "max": 2218.038535296917,
-            "count": 40
-        },
-        "Huggy.Losses.PolicyLoss.mean": {
-            "value": 0.016120348759351248,
-            "min": 0.014345712727905871,
-            "max": 0.019013986076849204,
-            "count": 40
-        },
-        "Huggy.Losses.PolicyLoss.sum": {
-            "value": 0.048361046278053745,
-            "min": 0.03087165418449634,
-            "max": 0.05704195823054761,
-            "count": 40
-        },
-        "Huggy.Losses.ValueLoss.mean": {
-            "value": 0.05144879606862863,
-            "min": 0.020817248274882634,
-            "max": 0.05970884294559558,
-            "count": 40
-        },
-        "Huggy.Losses.ValueLoss.sum": {
-            "value": 0.1543463882058859,
-            "min": 0.04163449654976527,
-            "max": 0.173665156836311,
-            "count": 40
-        },
-        "Huggy.Policy.LearningRate.mean": {
-            "value": 3.4034988655333344e-06,
-            "min": 3.4034988655333344e-06,
-            "max": 0.00029531017656327487,
-            "count": 40
-        },
-        "Huggy.Policy.LearningRate.sum": {
-            "value": 1.0210496596600003e-05,
-            "min": 1.0210496596600003e-05,
-            "max": 0.0008441998686000501,
-            "count": 40
-        },
-        "Huggy.Policy.Epsilon.mean": {
-            "value": 0.10113446666666669,
-            "min": 0.10113446666666669,
-            "max": 0.198436725,
-            "count": 40
-        },
-        "Huggy.Policy.Epsilon.sum": {
-            "value": 0.30340340000000005,
-            "min": 0.20742860000000005,
-            "max": 0.58139995,
-            "count": 40
-        },
-        "Huggy.Policy.Beta.mean": {
-            "value": 6.66098866666667e-05,
-            "min": 6.66098866666667e-05,
-            "max": 0.004921992577500001,
-            "count": 40
-        },
-        "Huggy.Policy.Beta.sum": {
-            "value": 0.00019982966000000007,
-            "min": 0.00019982966000000007,
-            "max": 0.014071857505000004,
-            "count": 40
-        },
-        "Huggy.IsTraining.mean": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 40
-        },
-        "Huggy.IsTraining.sum": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 40
-        }
-    },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1675774841",
-        "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics",
-        "mlagents_version": "0.29.0.dev0",
-        "mlagents_envs_version": "0.29.0.dev0",
         "communication_protocol_version": "1.5.0",
-        "pytorch_version": "1.8.1+cu102",
-        "numpy_version": "1.21.6",
-        "end_time_seconds": "1675777341"
     },
-    "total": 2499.553229916,
     "count": 1,
-    "self": 0.38974296400010644,
     "children": {
         "run_training.setup": {
-            "total": 0.12540149000000156,
             "count": 1,
-            "self": 0.12540149000000156
         },
         "TrainerController.start_learning": {
-            "total": 2499.038085462,
             "count": 1,
-            "self": 4.459906200040223,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 11.430268882999997,
                     "count": 1,
-                    "self": 11.430268882999997
-                },
-                "TrainerController.advance": {
-                    "total": 2483.02428767096,
-                    "count": 231887,
-                    "self": 4.80020010498356,
-                    "children": {
-                        "env_step": {
-                            "total": 1936.3103898659372,
-                            "count": 231887,
-                            "self": 1612.945572966961,
-                            "children": {
-                                "SubprocessEnvManager._take_step": {
-                                    "total": 320.3758816540504,
-                                    "count": 231887,
-                                    "self": 16.48313822310297,
-                                    "children": {
-                                        "TorchPolicy.evaluate": {
-                                            "total": 303.8927434309474,
-                                            "count": 223039,
-                                            "self": 76.1059216419576,
-                                            "children": {
-                                                "TorchPolicy.sample_actions": {
-                                                    "total": 227.7868217889898,
-                                                    "count": 223039,
-                                                    "self": 227.7868217889898
-                                                }
-                                            }
-                                        }
-                                    }
-                                },
-                                "workers": {
-                                    "total": 2.9889352449258126,
-                                    "count": 231887,
-                                    "self": 0.0,
-                                    "children": {
-                                        "worker_root": {
-                                            "total": 2490.4996110509,
-                                            "count": 231887,
-                                            "is_parallel": true,
-                                            "self": 1181.961858940976,
-                                            "children": {
-                                                "run_training.setup": {
-                                                    "total": 0.0,
-                                                    "count": 0,
-                                                    "is_parallel": true,
-                                                    "self": 0.0,
-                                                    "children": {
-                                                        "steps_from_proto": {
-                                                            "total": 0.0035053580000408147,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.0003519030000802559,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0031534549999605588,
-                                                                    "count": 2,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.0031534549999605588
-                                                                }
-                                                            }
-                                                        },
-                                                        "UnityEnvironment.step": {
-                                                            "total": 0.06337132800001655,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.000358854000012343,
-                                                            "children": {
-                                                                "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00021737800000209972,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.00021737800000209972
-                                                                },
-                                                                "communicator.exchange": {
-                                                                    "total": 0.062010756000006495,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.062010756000006495
-                                                                },
-                                                                "steps_from_proto": {
-                                                                    "total": 0.0007843399999956091,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.00028456799992682136,
-                                                                    "children": {
-                                                                        "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0004997720000687877,
-                                                                            "count": 2,
-                                                                            "is_parallel": true,
-                                                                            "self": 0.0004997720000687877
-                                                                        }
-                                                                    }
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                },
-                                                "UnityEnvironment.step": {
-                                                    "total": 1308.537752109924,
-                                                    "count": 231886,
-                                                    "is_parallel": true,
-                                                    "self": 38.942038724876056,
-                                                    "children": {
-                                                        "UnityEnvironment._generate_step_input": {
-                                                            "total": 82.73317857093588,
-                                                            "count": 231886,
-                                                            "is_parallel": true,
-                                                            "self": 82.73317857093588
-                                                        },
-                                                        "communicator.exchange": {
-                                                            "total": 1090.6349302629594,
-                                                            "count": 231886,
-                                                            "is_parallel": true,
-                                                            "self": 1090.6349302629594
-                                                        },
-                                                        "steps_from_proto": {
-                                                            "total": 96.22760455115247,
-                                                            "count": 231886,
-                                                            "is_parallel": true,
-                                                            "self": 41.294710258310715,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 54.93289429284175,
-                                                                    "count": 463772,
-                                                                    "is_parallel": true,
-                                                                    "self": 54.93289429284175
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        },
-                        "trainer_advance": {
-                            "total": 541.9136977000394,
-                            "count": 231887,
-                            "self": 6.891252809051366,
-                            "children": {
-                                "process_trajectory": {
-                                    "total": 168.41609711199072,
-                                    "count": 231887,
-                                    "self": 167.1537047229911,
-                                    "children": {
-                                        "RLTrainer._checkpoint": {
-                                            "total": 1.262392388999615,
-                                            "count": 10,
-                                            "self": 1.262392388999615
-                                        }
-                                    }
-                                },
-                                "_update_policy": {
-                                    "total": 366.6063477789973,
-                                    "count": 97,
-                                    "self": 308.5765702070148,
-                                    "children": {
-                                        "TorchPPOOptimizer.update": {
-                                            "total": 58.02977757198249,
-                                            "count": 2910,
-                                            "self": 58.02977757198249
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
                 },
                 "trainer_threads": {
-                    "total": 8.279998837679159e-07,
                     "count": 1,
-                    "self": 8.279998837679159e-07
                 },
                 "TrainerController._save_models": {
-                    "total": 0.12362187999997332,
                     "count": 1,
-                    "self": 0.002087185999698704,
-                    "children": {
-                        "RLTrainer._checkpoint": {
-                            "total": 0.12153469400027461,
-                            "count": 1,
-                            "self": 0.12153469400027461
-                        }
-                    }
                 }
             }
         }

 {
     "name": "root",
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1762173766",
+        "python_version": "3.10.12 (main, Jul  5 2023, 18:54:27) [GCC 11.2.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy2 --no-graphics --force",
+        "mlagents_version": "1.2.0.dev0",
+        "mlagents_envs_version": "1.2.0.dev0",
         "communication_protocol_version": "1.5.0",
+        "pytorch_version": "2.8.0+cu128",
+        "numpy_version": "1.23.5",
+        "end_time_seconds": "1762173766"
     },
+    "total": 0.04546879700001227,
     "count": 1,
+    "self": 0.007940021000194974,
     "children": {
         "run_training.setup": {
+            "total": 0.023404353999922023,
             "count": 1,
+            "self": 0.023404353999922023
         },
         "TrainerController.start_learning": {
+            "total": 0.014124421999895276,
             "count": 1,
+            "self": 0.0003588899999158457,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 0.013742294000167021,
                     "count": 1,
+                    "self": 0.013742294000167021
                 },
                 "trainer_threads": {
+                    "total": 1.4979996194597334e-06,
                     "count": 1,
+                    "self": 1.4979996194597334e-06
                 },
                 "TrainerController._save_models": {
+                    "total": 2.1740000192949083e-05,
                     "count": 1,
+                    "self": 2.1740000192949083e-05
                 }
             }
         }

run_logs/training_status.json CHANGED Viewed

@@ -1,119 +1,7 @@
 {
-    "Huggy": {
-        "checkpoints": [
-            {
-                "steps": 199966,
-                "file_path": "results/Huggy/Huggy/Huggy-199966.onnx",
-                "reward": 3.425651775797208,
-                "creation_time": 1675775098.1742382,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-199966.pt"
-                ]
-            },
-            {
-                "steps": 399948,
-                "file_path": "results/Huggy/Huggy/Huggy-399948.onnx",
-                "reward": 3.8748908042907715,
-                "creation_time": 1675775352.17324,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-399948.pt"
-                ]
-            },
-            {
-                "steps": 599968,
-                "file_path": "results/Huggy/Huggy/Huggy-599968.onnx",
-                "reward": 3.5677208367146944,
-                "creation_time": 1675775606.0478587,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-599968.pt"
-                ]
-            },
-            {
-                "steps": 799998,
-                "file_path": "results/Huggy/Huggy/Huggy-799998.onnx",
-                "reward": 3.773281857992212,
-                "creation_time": 1675775858.7409933,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-799998.pt"
-                ]
-            },
-            {
-                "steps": 999841,
-                "file_path": "results/Huggy/Huggy/Huggy-999841.onnx",
-                "reward": 3.8870706538685034,
-                "creation_time": 1675776109.7399635,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-999841.pt"
-                ]
-            },
-            {
-                "steps": 1199402,
-                "file_path": "results/Huggy/Huggy/Huggy-1199402.onnx",
-                "reward": 3.251411199569702,
-                "creation_time": 1675776355.9214182,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-1199402.pt"
-                ]
-            },
-            {
-                "steps": 1399908,
-                "file_path": "results/Huggy/Huggy/Huggy-1399908.onnx",
-                "reward": 4.009560413658619,
-                "creation_time": 1675776604.0595386,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-1399908.pt"
-                ]
-            },
-            {
-                "steps": 1599898,
-                "file_path": "results/Huggy/Huggy/Huggy-1599898.onnx",
-                "reward": 3.570658856845764,
-                "creation_time": 1675776848.6336129,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-1599898.pt"
-                ]
-            },
-            {
-                "steps": 1799958,
-                "file_path": "results/Huggy/Huggy/Huggy-1799958.onnx",
-                "reward": 3.881925370433543,
-                "creation_time": 1675777095.2964113,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-1799958.pt"
-                ]
-            },
-            {
-                "steps": 1999905,
-                "file_path": "results/Huggy/Huggy/Huggy-1999905.onnx",
-                "reward": 3.977051999833849,
-                "creation_time": 1675777340.8340354,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-1999905.pt"
-                ]
-            },
-            {
-                "steps": 2000030,
-                "file_path": "results/Huggy/Huggy/Huggy-2000030.onnx",
-                "reward": 4.080118775367737,
-                "creation_time": 1675777340.964843,
-                "auxillary_file_paths": [
-                    "results/Huggy/Huggy/Huggy-2000030.pt"
-                ]
-            }
-        ],
-        "final_checkpoint": {
-            "steps": 2000030,
-            "file_path": "results/Huggy/Huggy.onnx",
-            "reward": 4.080118775367737,
-            "creation_time": 1675777340.964843,
-            "auxillary_file_paths": [
-                "results/Huggy/Huggy/Huggy-2000030.pt"
-            ]
-        }
-    },
     "metadata": {
         "stats_format_version": "0.3.0",
-        "mlagents_version": "0.29.0.dev0",
-        "torch_version": "1.8.1+cu102"
     }
 }

 {
     "metadata": {
         "stats_format_version": "0.3.0",
+        "mlagents_version": "1.2.0.dev0",
+        "torch_version": "2.8.0+cu128"
     }
 }