{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [] }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" } }, "cells": [ { "cell_type": "code", "source": [ "%%capture\n", "# Clone the repository\n", "!git clone --depth 1 --branch hf-integration https://github.com/huggingface/ml-agents" ], "metadata": { "id": "G4mCAG8VD-IC" }, "execution_count": 2, "outputs": [] }, { "cell_type": "code", "source": [ "%%capture\n", "# Go inside the repository and install the package\n", "# NOTE: `%cd` is relative, so run this cell only once per session; a second run\n", "# would enter the nested ./ml-agents package directory and break the installs.\n", "%cd ml-agents\n", "!pip3 install -e ./ml-agents-envs\n", "!pip3 install -e ./ml-agents" ], "metadata": { "id": "NcpEBgG4ETH2" }, "execution_count": 3, "outputs": [] }, { "cell_type": "code", "source": [ "# Create ./training-envs-executables/linux, which will hold the environment build.\n", "# -p also creates the parent directory and does not fail if it already exists,\n", "# so this cell can be re-run safely.\n", "!mkdir -p ./training-envs-executables/linux" ], "metadata": { "id": "lXhbEf4uEYL8" }, "execution_count": 4, "outputs": [] }, { "cell_type": "code", "source": [ "# Download the Pyramids environment archive from Google Drive.\n", "# The inner wget saves the session cookies and sed extracts the `confirm=` token\n", "# from the response; the outer wget reuses both to fetch the zip, then the\n", "# temporary cookie file is removed.\n", "!wget --load-cookies /tmp/cookies.txt \"https://docs.google.com/uc?export=download&confirm=$(wget --quiet --save-cookies /tmp/cookies.txt --keep-session-cookies 'https://docs.google.com/uc?export=download&id=1UiFNdKlsH0NTu32xV-giYUEVKV4-vc7H' -O- | sed -rn 's/.*confirm=([0-9A-Za-z_]+).*/\\1\\n/p')&id=1UiFNdKlsH0NTu32xV-giYUEVKV4-vc7H\" -O ./training-envs-executables/linux/Pyramids.zip && rm -rf /tmp/cookies.txt" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "uLDPaf0PFAsO", "outputId": "0eb271bb-6847-434a-c86b-037f4bbc4ae4" }, "execution_count": 8, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "--2023-03-29 06:35:26-- https://docs.google.com/uc?export=download&confirm=t&id=1UiFNdKlsH0NTu32xV-giYUEVKV4-vc7H\n", "Resolving docs.google.com (docs.google.com)... 74.125.124.101, 74.125.124.102, 74.125.124.100, ...\n", "Connecting to docs.google.com (docs.google.com)|74.125.124.101|:443... 
connected.\n", "HTTP request sent, awaiting response... 303 See Other\n", "Location: https://doc-04-8c-docs.googleusercontent.com/docs/securesc/ha0ro937gcuc7l7deffksulhg5h7mbp1/rjm8bjnjjbaceuunacqhu0f96cocc32v/1680071700000/09764732090272539193/*/1UiFNdKlsH0NTu32xV-giYUEVKV4-vc7H?e=download&uuid=29de938c-bba9-4c4e-ab49-c669aefc08dc [following]\n", "Warning: wildcards not supported in HTTP.\n", "--2023-03-29 06:35:26-- https://doc-04-8c-docs.googleusercontent.com/docs/securesc/ha0ro937gcuc7l7deffksulhg5h7mbp1/rjm8bjnjjbaceuunacqhu0f96cocc32v/1680071700000/09764732090272539193/*/1UiFNdKlsH0NTu32xV-giYUEVKV4-vc7H?e=download&uuid=29de938c-bba9-4c4e-ab49-c669aefc08dc\n", "Resolving doc-04-8c-docs.googleusercontent.com (doc-04-8c-docs.googleusercontent.com)... 142.250.159.132, 2607:f8b0:4001:c58::84\n", "Connecting to doc-04-8c-docs.googleusercontent.com (doc-04-8c-docs.googleusercontent.com)|142.250.159.132|:443... connected.\n", "HTTP request sent, awaiting response... 200 OK\n", "Length: 42907187 (41M) [application/zip]\n", "Saving to: ‘./training-envs-executables/linux/Pyramids.zip’\n", "\n", "./training-envs-exe 100%[===================>] 40.92M 150MB/s in 0.3s \n", "\n", "2023-03-29 06:35:26 (150 MB/s) - ‘./training-envs-executables/linux/Pyramids.zip’ saved [42907187/42907187]\n", "\n" ] } ] }, { "cell_type": "code", "source": [ "%%capture\n", "# Extract the downloaded archive next to it.\n", "# -o overwrites existing files without prompting, so re-running this cell does not\n", "# stall on an overwrite prompt that %%capture would hide.\n", "!unzip -o -d ./training-envs-executables/linux/ ./training-envs-executables/linux/Pyramids.zip" ], "metadata": { "id": "mYB8LtCgD41b" }, "execution_count": 9, "outputs": [] }, { "cell_type": "code", "source": [ "# Make the extracted environment binary executable so mlagents-learn can launch it\n", "!chmod -R 755 ./training-envs-executables/linux/Pyramids/Pyramids" ], "metadata": { "id": "xwUAhMU7EDOx" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "# Train the Pyramids agent with the PPO + RND configuration, headless (--no-graphics).\n", "# Results are written to ./results/<run-id>; re-running with the same --run-id\n", "# requires adding --resume (continue) or --force (overwrite).\n", "!mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=\"Pyramids Training\" --no-graphics" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": 
"s-73GPpPEHDl", "outputId": "351b355b-728e-4dae-a941-482c272d64d0" }, "execution_count": 10, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\n", " ┐ ╖\n", " ╓╖╬│╡ ││╬╖╖\n", " ╓╖╬│││││┘ ╬│││││╬╖\n", " ╖╬│││││╬╜ ╙╬│││││╖╖ ╗╗╗\n", " ╬╬╬╬╖││╦╖ ╖╬││╗╣╣╣╬ ╟╣╣╬ ╟╣╣╣ ╜╜╜ ╟╣╣\n", " ╬╬╬╬╬╬╬╬╖│╬╖╖╓╬╪│╓╣╣╣╣╣╣╣╬ ╟╣╣╬ ╟╣╣╣ ╒╣╣╖╗╣╣╣╗ ╣╣╣ ╣╣╣╣╣╣ ╟╣╣╖ ╣╣╣\n", " ╬╬╬╬┐ ╙╬╬╬╬│╓╣╣╣╝╜ ╫╣╣╣╬ ╟╣╣╬ ╟╣╣╣ ╟╣╣╣╙ ╙╣╣╣ ╣╣╣ ╙╟╣╣╜╙ ╫╣╣ ╟╣╣\n", " ╬╬╬╬┐ ╙╬╬╣╣ ╫╣╣╣╬ ╟╣╣╬ ╟╣╣╣ ╟╣╣╬ ╣╣╣ ╣╣╣ ╟╣╣ ╣╣╣┌╣╣╜\n", " ╬╬╬╜ ╬╬╣╣ ╙╝╣╣╬ ╙╣╣╣╗╖╓╗╣╣╣╜ ╟╣╣╬ ╣╣╣ ╣╣╣ ╟╣╣╦╓ ╣╣╣╣╣\n", " ╙ ╓╦╖ ╬╬╣╣ ╓╗╗╖ ╙╝╣╣╣╣╝╜ ╘╝╝╜ ╝╝╝ ╝╝╝ ╙╣╣╣ ╟╣╣╣\n", " ╩╬╬╬╬╬╬╦╦╬╬╣╣╗╣╣╣╣╣╣╣╝ ╫╣╣╣╣\n", " ╙╬╬╬╬╬╬╬╣╣╣╣╣╣╝╜\n", " ╙╬╬╬╣╣╣╜\n", " ╙\n", " \n", " Version information:\n", " ml-agents: 0.31.0.dev0,\n", " ml-agents-envs: 0.31.0.dev0,\n", " Communicator API: 1.5.0,\n", " PyTorch: 1.11.0+cu102\n", "[INFO] Connected to Unity environment with package version 2.2.1-exp.1 and communication version 1.5.0\n", "[INFO] Connected new brain: Pyramids?team=0\n", "2023-03-29 06:36:53.359663: I tensorflow/core/platform/cpu_feature_guard.cc:193] This TensorFlow binary is optimized with oneAPI Deep Neural Network Library (oneDNN) to use the following CPU instructions in performance-critical operations: AVX2 FMA\n", "To enable them in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", "2023-03-29 06:36:58.264300: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer.so.7'; dlerror: libnvinfer.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /usr/local/nvidia/lib:/usr/local/nvidia/lib64\n", "2023-03-29 06:36:58.266029: W tensorflow/compiler/xla/stream_executor/platform/default/dso_loader.cc:64] Could not load dynamic library 'libnvinfer_plugin.so.7'; dlerror: libnvinfer_plugin.so.7: cannot open shared object file: No such file or directory; LD_LIBRARY_PATH: /usr/local/nvidia/lib:/usr/local/nvidia/lib64\n", "2023-03-29 
06:36:58.266820: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Cannot dlopen some TensorRT libraries. If you would like to use Nvidia GPU with TensorRT, please make sure the missing libraries mentioned above are installed properly.\n", "[INFO] Hyperparameters for behavior name Pyramids: \n", "\ttrainer_type:\tppo\n", "\thyperparameters:\t\n", "\t batch_size:\t128\n", "\t buffer_size:\t2048\n", "\t learning_rate:\t0.0003\n", "\t beta:\t0.01\n", "\t epsilon:\t0.2\n", "\t lambd:\t0.95\n", "\t num_epoch:\t3\n", "\t shared_critic:\tFalse\n", "\t learning_rate_schedule:\tlinear\n", "\t beta_schedule:\tlinear\n", "\t epsilon_schedule:\tlinear\n", "\tcheckpoint_interval:\t500000\n", "\tnetwork_settings:\t\n", "\t normalize:\tFalse\n", "\t hidden_units:\t512\n", "\t num_layers:\t2\n", "\t vis_encode_type:\tsimple\n", "\t memory:\tNone\n", "\t goal_conditioning_type:\thyper\n", "\t deterministic:\tFalse\n", "\treward_signals:\t\n", "\t extrinsic:\t\n", "\t gamma:\t0.99\n", "\t strength:\t1.0\n", "\t network_settings:\t\n", "\t normalize:\tFalse\n", "\t hidden_units:\t128\n", "\t num_layers:\t2\n", "\t vis_encode_type:\tsimple\n", "\t memory:\tNone\n", "\t goal_conditioning_type:\thyper\n", "\t deterministic:\tFalse\n", "\t rnd:\t\n", "\t gamma:\t0.99\n", "\t strength:\t0.01\n", "\t network_settings:\t\n", "\t normalize:\tFalse\n", "\t hidden_units:\t64\n", "\t num_layers:\t3\n", "\t vis_encode_type:\tsimple\n", "\t memory:\tNone\n", "\t goal_conditioning_type:\thyper\n", "\t deterministic:\tFalse\n", "\t learning_rate:\t0.0001\n", "\t encoding_size:\tNone\n", "\tinit_path:\tNone\n", "\tkeep_checkpoints:\t5\n", "\teven_checkpoints:\tFalse\n", "\tmax_steps:\t3000000\n", "\ttime_horizon:\t128\n", "\tsummary_freq:\t30000\n", "\tthreaded:\tFalse\n", "\tself_play:\tNone\n", "\tbehavioral_cloning:\tNone\n", "[INFO] Pyramids. Step: 30000. Time Elapsed: 101.455 s. Mean Reward: -0.872. Std of Reward: 0.514. Training.\n", "[INFO] Pyramids. Step: 60000. 
Time Elapsed: 199.014 s. Mean Reward: -0.933. Std of Reward: 0.368. Training.\n", "[INFO] Pyramids. Step: 90000. Time Elapsed: 300.673 s. Mean Reward: -0.863. Std of Reward: 0.529. Training.\n", "[INFO] Pyramids. Step: 120000. Time Elapsed: 400.459 s. Mean Reward: -0.850. Std of Reward: 0.583. Training.\n", "[INFO] Pyramids. Step: 150000. Time Elapsed: 504.687 s. Mean Reward: -0.581. Std of Reward: 0.894. Training.\n", "[INFO] Pyramids. Step: 180000. Time Elapsed: 612.085 s. Mean Reward: -0.855. Std of Reward: 0.559. Training.\n", "[INFO] Pyramids. Step: 210000. Time Elapsed: 717.356 s. Mean Reward: -0.404. Std of Reward: 1.000. Training.\n", "[INFO] Pyramids. Step: 240000. Time Elapsed: 823.675 s. Mean Reward: -0.597. Std of Reward: 0.936. Training.\n", "[INFO] Pyramids. Step: 270000. Time Elapsed: 927.453 s. Mean Reward: -0.514. Std of Reward: 0.959. Training.\n", "[INFO] Pyramids. Step: 300000. Time Elapsed: 1026.001 s. Mean Reward: -0.525. Std of Reward: 0.968. Training.\n", "[INFO] Pyramids. Step: 330000. Time Elapsed: 1126.188 s. Mean Reward: -0.349. Std of Reward: 1.075. Training.\n", "[INFO] Pyramids. Step: 360000. Time Elapsed: 1230.222 s. Mean Reward: 0.189. Std of Reward: 1.232. Training.\n", "[INFO] Pyramids. Step: 390000. Time Elapsed: 1334.848 s. Mean Reward: 0.015. Std of Reward: 1.212. Training.\n", "[INFO] Pyramids. Step: 420000. Time Elapsed: 1448.564 s. Mean Reward: 0.789. Std of Reward: 1.101. Training.\n", "[INFO] Pyramids. Step: 450000. Time Elapsed: 1570.904 s. Mean Reward: 1.062. Std of Reward: 0.976. Training.\n", "[INFO] Pyramids. Step: 480000. Time Elapsed: 1689.276 s. Mean Reward: 1.207. Std of Reward: 0.893. Training.\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-499916.onnx\n", "[INFO] Pyramids. Step: 510000. Time Elapsed: 1806.577 s. Mean Reward: 1.311. Std of Reward: 0.847. Training.\n", "[INFO] Pyramids. Step: 540000. Time Elapsed: 1920.003 s. Mean Reward: 1.129. Std of Reward: 0.993. 
Training.\n", "[INFO] Pyramids. Step: 570000. Time Elapsed: 2037.317 s. Mean Reward: 1.326. Std of Reward: 0.800. Training.\n", "[INFO] Pyramids. Step: 600000. Time Elapsed: 2159.034 s. Mean Reward: 1.396. Std of Reward: 0.709. Training.\n", "[INFO] Pyramids. Step: 630000. Time Elapsed: 2277.282 s. Mean Reward: 1.261. Std of Reward: 0.901. Training.\n", "[INFO] Pyramids. Step: 660000. Time Elapsed: 2410.636 s. Mean Reward: 1.548. Std of Reward: 0.543. Training.\n", "[INFO] Pyramids. Step: 690000. Time Elapsed: 2553.031 s. Mean Reward: 1.605. Std of Reward: 0.506. Training.\n", "[INFO] Pyramids. Step: 720000. Time Elapsed: 2695.693 s. Mean Reward: 1.661. Std of Reward: 0.410. Training.\n", "[INFO] Pyramids. Step: 750000. Time Elapsed: 2832.742 s. Mean Reward: 1.621. Std of Reward: 0.504. Training.\n", "[INFO] Pyramids. Step: 780000. Time Elapsed: 2960.088 s. Mean Reward: 1.627. Std of Reward: 0.433. Training.\n", "[INFO] Pyramids. Step: 810000. Time Elapsed: 3089.164 s. Mean Reward: 1.628. Std of Reward: 0.340. Training.\n", "[INFO] Pyramids. Step: 840000. Time Elapsed: 3224.046 s. Mean Reward: 1.569. Std of Reward: 0.583. Training.\n", "[INFO] Pyramids. Step: 870000. Time Elapsed: 3361.922 s. Mean Reward: 1.666. Std of Reward: 0.407. Training.\n", "[INFO] Pyramids. Step: 900000. Time Elapsed: 3491.083 s. Mean Reward: 1.700. Std of Reward: 0.391. Training.\n", "[INFO] Pyramids. Step: 930000. Time Elapsed: 3622.705 s. Mean Reward: 1.674. Std of Reward: 0.328. Training.\n", "[INFO] Pyramids. Step: 960000. Time Elapsed: 3748.747 s. Mean Reward: 1.663. Std of Reward: 0.420. Training.\n", "[INFO] Pyramids. Step: 990000. Time Elapsed: 3884.888 s. Mean Reward: 1.720. Std of Reward: 0.186. Training.\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-999942.onnx\n", "[INFO] Pyramids. Step: 1020000. Time Elapsed: 4022.687 s. Mean Reward: 1.743. Std of Reward: 0.283. Training.\n", "[INFO] Pyramids. Step: 1050000. Time Elapsed: 4149.459 s. Mean Reward: 1.689. 
Std of Reward: 0.328. Training.\n", "[INFO] Pyramids. Step: 1080000. Time Elapsed: 4274.465 s. Mean Reward: 1.575. Std of Reward: 0.671. Training.\n", "[INFO] Pyramids. Step: 1110000. Time Elapsed: 4404.286 s. Mean Reward: 1.636. Std of Reward: 0.498. Training.\n", "[INFO] Pyramids. Step: 1140000. Time Elapsed: 4533.829 s. Mean Reward: 1.686. Std of Reward: 0.395. Training.\n", "[INFO] Pyramids. Step: 1170000. Time Elapsed: 4666.266 s. Mean Reward: 1.724. Std of Reward: 0.285. Training.\n", "[INFO] Pyramids. Step: 1200000. Time Elapsed: 4802.121 s. Mean Reward: 1.673. Std of Reward: 0.475. Training.\n", "[INFO] Pyramids. Step: 1230000. Time Elapsed: 4936.895 s. Mean Reward: 1.718. Std of Reward: 0.312. Training.\n", "[INFO] Pyramids. Step: 1260000. Time Elapsed: 5075.556 s. Mean Reward: 1.630. Std of Reward: 0.588. Training.\n", "[INFO] Pyramids. Step: 1290000. Time Elapsed: 5205.058 s. Mean Reward: 1.721. Std of Reward: 0.299. Training.\n", "[INFO] Pyramids. Step: 1320000. Time Elapsed: 5341.708 s. Mean Reward: 1.700. Std of Reward: 0.323. Training.\n", "[INFO] Pyramids. Step: 1350000. Time Elapsed: 5475.899 s. Mean Reward: 1.742. Std of Reward: 0.149. Training.\n", "[INFO] Pyramids. Step: 1380000. Time Elapsed: 5604.559 s. Mean Reward: 1.652. Std of Reward: 0.549. Training.\n", "[INFO] Pyramids. Step: 1410000. Time Elapsed: 5746.207 s. Mean Reward: 1.663. Std of Reward: 0.584. Training.\n", "[INFO] Pyramids. Step: 1440000. Time Elapsed: 5886.518 s. Mean Reward: 1.703. Std of Reward: 0.397. Training.\n", "[INFO] Pyramids. Step: 1470000. Time Elapsed: 6024.444 s. Mean Reward: 1.687. Std of Reward: 0.469. Training.\n", "[INFO] Pyramids. Step: 1500000. Time Elapsed: 6162.328 s. Mean Reward: 1.722. Std of Reward: 0.297. Training.\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-1499974.onnx\n", "[INFO] Pyramids. Step: 1530000. Time Elapsed: 6307.136 s. Mean Reward: 1.705. Std of Reward: 0.389. Training.\n", "[INFO] Pyramids. Step: 1560000. 
Time Elapsed: 6452.765 s. Mean Reward: 1.708. Std of Reward: 0.454. Training.\n", "[INFO] Pyramids. Step: 1590000. Time Elapsed: 6584.716 s. Mean Reward: 1.665. Std of Reward: 0.483. Training.\n", "[INFO] Pyramids. Step: 1620000. Time Elapsed: 6724.784 s. Mean Reward: 1.720. Std of Reward: 0.436. Training.\n", "[INFO] Pyramids. Step: 1650000. Time Elapsed: 6858.409 s. Mean Reward: 1.706. Std of Reward: 0.446. Training.\n", "[INFO] Pyramids. Step: 1680000. Time Elapsed: 6985.550 s. Mean Reward: 1.720. Std of Reward: 0.389. Training.\n", "[INFO] Pyramids. Step: 1710000. Time Elapsed: 7119.326 s. Mean Reward: 1.710. Std of Reward: 0.439. Training.\n", "[INFO] Pyramids. Step: 1740000. Time Elapsed: 7256.310 s. Mean Reward: 1.741. Std of Reward: 0.360. Training.\n", "[INFO] Pyramids. Step: 1770000. Time Elapsed: 7393.341 s. Mean Reward: 1.748. Std of Reward: 0.369. Training.\n", "[INFO] Pyramids. Step: 1800000. Time Elapsed: 7531.948 s. Mean Reward: 1.764. Std of Reward: 0.264. Training.\n", "[INFO] Pyramids. Step: 1830000. Time Elapsed: 7666.819 s. Mean Reward: 1.760. Std of Reward: 0.276. Training.\n", "[INFO] Pyramids. Step: 1860000. Time Elapsed: 7799.391 s. Mean Reward: 1.758. Std of Reward: 0.170. Training.\n", "[INFO] Pyramids. Step: 1890000. Time Elapsed: 7932.572 s. Mean Reward: 1.744. Std of Reward: 0.284. Training.\n", "[INFO] Pyramids. Step: 1920000. Time Elapsed: 8066.671 s. Mean Reward: 1.773. Std of Reward: 0.139. Training.\n", "[INFO] Pyramids. Step: 1950000. Time Elapsed: 8207.269 s. Mean Reward: 1.768. Std of Reward: 0.161. Training.\n", "[INFO] Pyramids. Step: 1980000. Time Elapsed: 8346.790 s. Mean Reward: 1.802. Std of Reward: 0.109. Training.\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-1999967.onnx\n", "[INFO] Pyramids. Step: 2010000. Time Elapsed: 8481.710 s. Mean Reward: 1.732. Std of Reward: 0.428. Training.\n", "[INFO] Pyramids. Step: 2040000. Time Elapsed: 8613.497 s. Mean Reward: 1.703. Std of Reward: 0.448. 
Training.\n", "[INFO] Pyramids. Step: 2070000. Time Elapsed: 8749.200 s. Mean Reward: 1.754. Std of Reward: 0.177. Training.\n", "[INFO] Pyramids. Step: 2100000. Time Elapsed: 8885.866 s. Mean Reward: 1.760. Std of Reward: 0.282. Training.\n", "[INFO] Pyramids. Step: 2130000. Time Elapsed: 9023.976 s. Mean Reward: 1.770. Std of Reward: 0.162. Training.\n", "[INFO] Pyramids. Step: 2160000. Time Elapsed: 9166.838 s. Mean Reward: 1.742. Std of Reward: 0.410. Training.\n", "[INFO] Pyramids. Step: 2190000. Time Elapsed: 9307.147 s. Mean Reward: 1.770. Std of Reward: 0.273. Training.\n", "[INFO] Pyramids. Step: 2220000. Time Elapsed: 9441.487 s. Mean Reward: 1.707. Std of Reward: 0.388. Training.\n", "[INFO] Pyramids. Step: 2250000. Time Elapsed: 9581.738 s. Mean Reward: 1.784. Std of Reward: 0.130. Training.\n", "[INFO] Pyramids. Step: 2280000. Time Elapsed: 9719.787 s. Mean Reward: 1.757. Std of Reward: 0.274. Training.\n", "[INFO] Pyramids. Step: 2310000. Time Elapsed: 9857.539 s. Mean Reward: 1.770. Std of Reward: 0.153. Training.\n", "[INFO] Pyramids. Step: 2340000. Time Elapsed: 9987.205 s. Mean Reward: 1.725. Std of Reward: 0.375. Training.\n", "[INFO] Pyramids. Step: 2370000. Time Elapsed: 10117.730 s. Mean Reward: 1.736. Std of Reward: 0.308. Training.\n", "[INFO] Pyramids. Step: 2400000. Time Elapsed: 10252.886 s. Mean Reward: 1.733. Std of Reward: 0.373. Training.\n", "[INFO] Pyramids. Step: 2430000. Time Elapsed: 10397.404 s. Mean Reward: 1.761. Std of Reward: 0.267. Training.\n", "[INFO] Pyramids. Step: 2460000. Time Elapsed: 10533.164 s. Mean Reward: 1.777. Std of Reward: 0.272. Training.\n", "[INFO] Pyramids. Step: 2490000. Time Elapsed: 10675.384 s. Mean Reward: 1.791. Std of Reward: 0.121. Training.\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-2499954.onnx\n", "[INFO] Pyramids. Step: 2520000. Time Elapsed: 10817.342 s. Mean Reward: 1.752. Std of Reward: 0.353. Training.\n", "[INFO] Pyramids. Step: 2550000. Time Elapsed: 10957.949 s. 
Mean Reward: 1.795. Std of Reward: 0.118. Training.\n", "[INFO] Pyramids. Step: 2580000. Time Elapsed: 11093.594 s. Mean Reward: 1.733. Std of Reward: 0.427. Training.\n", "[INFO] Pyramids. Step: 2610000. Time Elapsed: 11227.655 s. Mean Reward: 1.716. Std of Reward: 0.449. Training.\n", "[INFO] Pyramids. Step: 2640000. Time Elapsed: 11362.885 s. Mean Reward: 1.776. Std of Reward: 0.150. Training.\n", "[INFO] Pyramids. Step: 2670000. Time Elapsed: 11500.539 s. Mean Reward: 1.715. Std of Reward: 0.443. Training.\n", "[INFO] Pyramids. Step: 2700000. Time Elapsed: 11643.585 s. Mean Reward: 1.728. Std of Reward: 0.433. Training.\n", "[INFO] Pyramids. Step: 2730000. Time Elapsed: 11778.876 s. Mean Reward: 1.760. Std of Reward: 0.280. Training.\n", "[INFO] Pyramids. Step: 2760000. Time Elapsed: 11917.592 s. Mean Reward: 1.770. Std of Reward: 0.267. Training.\n", "[INFO] Pyramids. Step: 2790000. Time Elapsed: 12051.461 s. Mean Reward: 1.749. Std of Reward: 0.360. Training.\n", "[INFO] Pyramids. Step: 2820000. Time Elapsed: 12191.994 s. Mean Reward: 1.768. Std of Reward: 0.350. Training.\n", "[INFO] Pyramids. Step: 2850000. Time Elapsed: 12319.137 s. Mean Reward: 1.681. Std of Reward: 0.522. Training.\n", "[INFO] Pyramids. Step: 2880000. Time Elapsed: 12457.755 s. Mean Reward: 1.741. Std of Reward: 0.414. Training.\n", "[INFO] Pyramids. Step: 2910000. Time Elapsed: 12583.409 s. Mean Reward: 1.736. Std of Reward: 0.366. Training.\n", "[INFO] Pyramids. Step: 2940000. Time Elapsed: 12717.883 s. Mean Reward: 1.780. Std of Reward: 0.139. Training.\n", "[INFO] Pyramids. Step: 2970000. Time Elapsed: 12853.405 s. Mean Reward: 1.773. Std of Reward: 0.268. Training.\n", "[INFO] Pyramids. Step: 3000000. Time Elapsed: 12983.290 s. Mean Reward: 1.697. Std of Reward: 0.507. 
Training.\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-2999875.onnx\n", "[INFO] Exported results/Pyramids Training/Pyramids/Pyramids-3000131.onnx\n", "[INFO] Copied results/Pyramids Training/Pyramids/Pyramids-3000131.onnx to results/Pyramids Training/Pyramids.onnx.\n" ] } ] }, { "cell_type": "code", "source": [ "# Push the trained run to the Hugging Face Hub.\n", "# Requires being logged in to Hugging Face with a write token beforehand\n", "# (e.g. `huggingface-cli login`); that step is not part of this notebook.\n", "# --local-dir is relative to the repository root entered earlier with %cd.\n", "!mlagents-push-to-hf --run-id=\"Pyramids Training\" --local-dir=\"./results/Pyramids Training\" --repo-id=\"DrishtiSharma/ppo-Pyramids\" --commit-message=\"First Push\"" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "5BHFfKX16gzn", "outputId": "9d73f2cc-4f86-4a6a-c3d1-921028364e38" }, "execution_count": 33, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "/content/ml-agents/hub/ppo-Pyramids is already a clone of https://huggingface.co/DrishtiSharma/ppo-Pyramids. Make sure you pull the latest changes with `repo.git_pull()`.\n", "WARNING:huggingface_hub.repository:/content/ml-agents/hub/ppo-Pyramids is already a clone of https://huggingface.co/DrishtiSharma/ppo-Pyramids. 
Make sure you pull the latest changes with `repo.git_pull()`.\n", "Upload file Pyramids-1499974.pt: 0% 32.0k/8.25M [00:00 main\n", "\n", "WARNING:huggingface_hub.repository:To https://huggingface.co/DrishtiSharma/ppo-Pyramids\n", " 1cfb7ee..62da25f main -> main\n", "\n", "Upload file Pyramids-1499974.pt: 100% 8.25M/8.25M [00:04<00:00, 2.15MB/s]\n", "\n", "Upload file Pyramids-2499954.onnx: 100% 1.35M/1.35M [00:04<00:00, 345kB/s]\u001b[A\n", "Upload file Pyramids-2499954.onnx: 100% 1.35M/1.35M [00:04<00:00, 345kB/s]\n", "\n", "\n", "Upload file Pyramids-2999875.onnx: 100% 1.35M/1.35M [00:04<00:00, 345kB/s]\u001b[A\u001b[A\n", "\n", "Upload file Pyramids-2999875.onnx: 100% 1.35M/1.35M [00:04<00:00, 345kB/s]\n", "\n", "\n", "\n", "Upload file Pyramids-1499974.onnx: 100% 1.35M/1.35M [00:04<00:00, 345kB/s]\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "Upload file Pyramids-1499974.onnx: 100% 1.35M/1.35M [00:04<00:00, 345kB/s]\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-2499954.pt: 100% 8.25M/8.25M [00:04<00:00, 2.05MB/s]\u001b[A\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "\n", "Upload file Pyramids-2499954.pt: 100% 8.25M/8.25M [00:04<00:00, 2.15MB/s]\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-3000131.pt: 100% 8.25M/8.25M [00:04<00:00, 2.07MB/s]\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-3000131.pt: 100% 8.25M/8.25M [00:04<00:00, 2.15MB/s]\n", "\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-1999967.pt: 100% 8.25M/8.25M [00:04<00:00, 2.02MB/s]\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-1999967.pt: 100% 8.25M/8.25M [00:04<00:00, 2.15MB/s]\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-2999875.pt: 100% 8.25M/8.25M [00:04<00:00, 2.05MB/s]\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-2999875.pt: 100% 8.25M/8.25M [00:04<00:00, 2.15MB/s]\n", "\n", "\n", "\n", 
"\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-1999967.onnx: 100% 1.35M/1.35M [00:03<00:00, 460kB/s]\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids-1999967.onnx: 100% 1.35M/1.35M [00:03<00:00, 460kB/s]\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids/events.out.tfevents.1680071821.5e4b33e6d482.1878.0: 100% 885k/885k [00:03<00:00, 290kB/s]\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\u001b[A\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "\n", "Upload file Pyramids/events.out.tfevents.1680071821.5e4b33e6d482.1878.0: 100% 885k/885k [00:03<00:00, 290kB/s]\n", "\n", " Your model is pushed to the hub. You can view your model here: https://huggingface.co/DrishtiSharma/ppo-Pyramids\n" ] } ] }, { "cell_type": "code", "source": [], "metadata": { "id": "MYEdml4j7JPg" }, "execution_count": null, "outputs": [] } ] }