Instructions to use bittoby/ppo-Huggy with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- ml-agents
How to use bittoby/ppo-Huggy with ml-agents:
mlagents-load-from-hf --repo-id="bittoby/ppo-Huggy" --local-dir="./downloads"
- Notebooks
- Google Colab
- Kaggle
| { | |
| "name": "root", | |
| "gauges": { | |
| "Huggy.Policy.Entropy.mean": { | |
| "value": 1.4030195474624634, | |
| "min": 1.4030195474624634, | |
| "max": 1.428842306137085, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Entropy.sum": { | |
| "value": 70874.9375, | |
| "min": 67786.9296875, | |
| "max": 75039.9765625, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.EpisodeLength.mean": { | |
| "value": 88.46332737030411, | |
| "min": 79.23434991974318, | |
| "max": 369.3703703703704, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.EpisodeLength.sum": { | |
| "value": 49451.0, | |
| "min": 49180.0, | |
| "max": 49964.0, | |
| "count": 40 | |
| }, | |
| "Huggy.Step.mean": { | |
| "value": 1999271.0, | |
| "min": 49611.0, | |
| "max": 1999271.0, | |
| "count": 40 | |
| }, | |
| "Huggy.Step.sum": { | |
| "value": 1999271.0, | |
| "min": 49611.0, | |
| "max": 1999271.0, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 2.426896333694458, | |
| "min": 0.11408145725727081, | |
| "max": 2.507927417755127, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 1356.635009765625, | |
| "min": 15.286914825439453, | |
| "max": 1559.382080078125, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.CumulativeReward.mean": { | |
| "value": 3.686092944499205, | |
| "min": 1.8897129868838325, | |
| "max": 3.9215332741587474, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.CumulativeReward.sum": { | |
| "value": 2060.5259559750557, | |
| "min": 253.22154024243355, | |
| "max": 2433.4563893079758, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicReward.mean": { | |
| "value": 3.686092944499205, | |
| "min": 1.8897129868838325, | |
| "max": 3.9215332741587474, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicReward.sum": { | |
| "value": 2060.5259559750557, | |
| "min": 253.22154024243355, | |
| "max": 2433.4563893079758, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.PolicyLoss.mean": { | |
| "value": 0.018960492238127496, | |
| "min": 0.013081660444731823, | |
| "max": 0.02061250276528881, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.PolicyLoss.sum": { | |
| "value": 0.056881476714382484, | |
| "min": 0.026163320889463645, | |
| "max": 0.06183750829586643, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.ValueLoss.mean": { | |
| "value": 0.06338192377653387, | |
| "min": 0.02155718971043825, | |
| "max": 0.06338192377653387, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.ValueLoss.sum": { | |
| "value": 0.19014577132960161, | |
| "min": 0.0431143794208765, | |
| "max": 0.19014577132960161, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.LearningRate.mean": { | |
| "value": 3.5872988042666683e-06, | |
| "min": 3.5872988042666683e-06, | |
| "max": 0.00029537865154045, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.LearningRate.sum": { | |
| "value": 1.0761896412800004e-05, | |
| "min": 1.0761896412800004e-05, | |
| "max": 0.0008443029185657, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Epsilon.mean": { | |
| "value": 0.10119573333333333, | |
| "min": 0.10119573333333333, | |
| "max": 0.19845954999999998, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Epsilon.sum": { | |
| "value": 0.3035872, | |
| "min": 0.20753945000000001, | |
| "max": 0.5814343000000002, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Beta.mean": { | |
| "value": 6.966709333333335e-05, | |
| "min": 6.966709333333335e-05, | |
| "max": 0.004923131545000001, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Beta.sum": { | |
| "value": 0.00020900128000000007, | |
| "min": 0.00020900128000000007, | |
| "max": 0.01407357157, | |
| "count": 40 | |
| }, | |
| "Huggy.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 40 | |
| }, | |
| "Huggy.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 40 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1766413994", | |
| "python_version": "3.10.12 (main, Nov 4 2025, 08:48:33) [GCC 11.4.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.8.0+cu128", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1766417003" | |
| }, | |
| "total": 3008.4399569789994, | |
| "count": 1, | |
| "self": 0.8550145739991422, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.032072455000161426, | |
| "count": 1, | |
| "self": 0.032072455000161426 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 3007.55286995, | |
| "count": 1, | |
| "self": 5.905111663184471, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.5637167620000127, | |
| "count": 1, | |
| "self": 3.5637167620000127 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2997.9178486508154, | |
| "count": 232688, | |
| "self": 5.5495252256910135, | |
| "children": { | |
| "env_step": { | |
| "total": 2450.0910307330864, | |
| "count": 232688, | |
| "self": 1977.7584741171381, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 468.6401643199058, | |
| "count": 232688, | |
| "self": 18.73896722677614, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 449.90119709312967, | |
| "count": 222964, | |
| "self": 449.90119709312967 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 3.692392296042499, | |
| "count": 232688, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2992.220750970095, | |
| "count": 232688, | |
| "is_parallel": true, | |
| "self": 1394.050097105947, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0009020099998906517, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0002559219999511697, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.000646087999939482, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.000646087999939482 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.030953276999980517, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00037018700004409766, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.00023222499999064894, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00023222499999064894 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.029502222000019174, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.029502222000019174 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0008486429999265965, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00025535399981890805, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0005932890001076885, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.0005932890001076885 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1598.170653864148, | |
| "count": 232687, | |
| "is_parallel": true, | |
| "self": 45.390814673973864, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 92.16356163105047, | |
| "count": 232687, | |
| "is_parallel": true, | |
| "self": 92.16356163105047 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1352.1120529010516, | |
| "count": 232687, | |
| "is_parallel": true, | |
| "self": 1352.1120529010516 | |
| }, | |
| "steps_from_proto": { | |
| "total": 108.50422465807219, | |
| "count": 232687, | |
| "is_parallel": true, | |
| "self": 36.907528690904655, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 71.59669596716753, | |
| "count": 465374, | |
| "is_parallel": true, | |
| "self": 71.59669596716753 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 542.2772926920379, | |
| "count": 232688, | |
| "self": 8.804529689173478, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 177.9177542778625, | |
| "count": 232688, | |
| "self": 176.67026571486258, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 1.2474885629999335, | |
| "count": 10, | |
| "self": 1.2474885629999335 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 355.5550087250019, | |
| "count": 97, | |
| "self": 285.56064945599064, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 69.99435926901128, | |
| "count": 2910, | |
| "self": 69.99435926901128 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.2760001482092775e-06, | |
| "count": 1, | |
| "self": 1.2760001482092775e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.16619159800029593, | |
| "count": 1, | |
| "self": 0.002326895000805962, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.16386470299948996, | |
| "count": 1, | |
| "self": 0.16386470299948996 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |