Instructions to use HellsCreature/ppo-Huggy with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- ml-agents
How to use HellsCreature/ppo-Huggy with ml-agents:
mlagents-load-from-hf --repo-id="HellsCreature/ppo-Huggy" --local-dir="./downloads"
- Notebooks
- Google Colab
- Kaggle
| { | |
| "name": "root", | |
| "gauges": { | |
| "Huggy.Policy.Entropy.mean": { | |
| "value": 1.405005931854248, | |
| "min": 1.405005931854248, | |
| "max": 1.4263216257095337, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Entropy.sum": { | |
| "value": 71016.0234375, | |
| "min": 66023.828125, | |
| "max": 78459.921875, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.EpisodeLength.mean": { | |
| "value": 79.14423076923077, | |
| "min": 79.06487341772151, | |
| "max": 434.6, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.EpisodeLength.sum": { | |
| "value": 49386.0, | |
| "min": 48723.0, | |
| "max": 50266.0, | |
| "count": 40 | |
| }, | |
| "Huggy.Step.mean": { | |
| "value": 1999922.0, | |
| "min": 49681.0, | |
| "max": 1999922.0, | |
| "count": 40 | |
| }, | |
| "Huggy.Step.sum": { | |
| "value": 1999922.0, | |
| "min": 49681.0, | |
| "max": 1999922.0, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 2.4805476665496826, | |
| "min": 0.05684151127934456, | |
| "max": 2.5248899459838867, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 1547.86181640625, | |
| "min": 6.4799323081970215, | |
| "max": 1547.86181640625, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.CumulativeReward.mean": { | |
| "value": 3.7999223657907586, | |
| "min": 1.9112243423597854, | |
| "max": 4.042667640243322, | |
| "count": 40 | |
| }, | |
| "Huggy.Environment.CumulativeReward.sum": { | |
| "value": 2371.1515562534332, | |
| "min": 217.87957502901554, | |
| "max": 2388.8964752554893, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicReward.mean": { | |
| "value": 3.7999223657907586, | |
| "min": 1.9112243423597854, | |
| "max": 4.042667640243322, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.ExtrinsicReward.sum": { | |
| "value": 2371.1515562534332, | |
| "min": 217.87957502901554, | |
| "max": 2388.8964752554893, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.PolicyLoss.mean": { | |
| "value": 0.01543372108313229, | |
| "min": 0.01349670224590227, | |
| "max": 0.020799967853236012, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.PolicyLoss.sum": { | |
| "value": 0.04630116324939687, | |
| "min": 0.02699340449180454, | |
| "max": 0.058431782506522714, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.ValueLoss.mean": { | |
| "value": 0.05906954109668731, | |
| "min": 0.02102249873181184, | |
| "max": 0.06229535359889269, | |
| "count": 40 | |
| }, | |
| "Huggy.Losses.ValueLoss.sum": { | |
| "value": 0.17720862329006193, | |
| "min": 0.04204499746362368, | |
| "max": 0.17833154785136382, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.LearningRate.mean": { | |
| "value": 3.4934988355333354e-06, | |
| "min": 3.4934988355333354e-06, | |
| "max": 0.0002953377015541, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.LearningRate.sum": { | |
| "value": 1.0480496506600006e-05, | |
| "min": 1.0480496506600006e-05, | |
| "max": 0.0008441677686107498, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Epsilon.mean": { | |
| "value": 0.10116446666666667, | |
| "min": 0.10116446666666667, | |
| "max": 0.19844590000000006, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Epsilon.sum": { | |
| "value": 0.3034934, | |
| "min": 0.20746395000000006, | |
| "max": 0.58138925, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Beta.mean": { | |
| "value": 6.810688666666673e-05, | |
| "min": 6.810688666666673e-05, | |
| "max": 0.004922450409999999, | |
| "count": 40 | |
| }, | |
| "Huggy.Policy.Beta.sum": { | |
| "value": 0.00020432066000000018, | |
| "min": 0.00020432066000000018, | |
| "max": 0.014071323575, | |
| "count": 40 | |
| }, | |
| "Huggy.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 40 | |
| }, | |
| "Huggy.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 40 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1775319491", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy2 --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.8.0+cu128", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1775324058" | |
| }, | |
| "total": 4566.802021547001, | |
| "count": 1, | |
| "self": 1.7076093120012956, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.03326064300017606, | |
| "count": 1, | |
| "self": 0.03326064300017606 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 4565.061151591999, | |
| "count": 1, | |
| "self": 7.778489825886936, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 3.412156143000175, | |
| "count": 1, | |
| "self": 3.412156143000175 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 4553.720171484114, | |
| "count": 232641, | |
| "self": 7.944058931618201, | |
| "children": { | |
| "env_step": { | |
| "total": 3088.9355124970607, | |
| "count": 232641, | |
| "self": 2627.737857952503, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 456.0585929994977, | |
| "count": 232641, | |
| "self": 27.9070279371208, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 428.1515650623769, | |
| "count": 222981, | |
| "self": 428.1515650623769 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 5.139061545060031, | |
| "count": 232641, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 4542.519983906968, | |
| "count": 232641, | |
| "is_parallel": true, | |
| "self": 2447.337797824559, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0008736800009501167, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0002450720003253082, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0006286080006248085, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.0006286080006248085 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.03435929499937629, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00038820099871372804, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0002232750011899043, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0002232750011899043 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.03294942600041395, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.03294942600041395 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0007983929990587058, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0002162809978472069, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0005821120012114989, | |
| "count": 2, | |
| "is_parallel": true, | |
| "self": 0.0005821120012114989 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 2095.1821860824093, | |
| "count": 232640, | |
| "is_parallel": true, | |
| "self": 62.34558957979425, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 112.19080371913333, | |
| "count": 232640, | |
| "is_parallel": true, | |
| "self": 112.19080371913333 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1785.3339640135637, | |
| "count": 232640, | |
| "is_parallel": true, | |
| "self": 1785.3339640135637 | |
| }, | |
| "steps_from_proto": { | |
| "total": 135.31182876991807, | |
| "count": 232640, | |
| "is_parallel": true, | |
| "self": 44.180447293936595, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 91.13138147598147, | |
| "count": 465280, | |
| "is_parallel": true, | |
| "self": 91.13138147598147 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 1456.840600055435, | |
| "count": 232641, | |
| "self": 12.111325549789399, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 234.63921871964703, | |
| "count": 232641, | |
| "self": 233.2922486126481, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 1.3469701069989242, | |
| "count": 10, | |
| "self": 1.3469701069989242 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 1210.0900557859986, | |
| "count": 97, | |
| "self": 312.0415895900205, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 898.0484661959781, | |
| "count": 2910, | |
| "self": 898.0484661959781 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.562999386806041e-06, | |
| "count": 1, | |
| "self": 1.562999386806041e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.15033257599861827, | |
| "count": 1, | |
| "self": 0.0029366489998210454, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.14739592699879722, | |
| "count": 1, | |
| "self": 0.14739592699879722 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |