{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "gpuType": "T4" }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "accelerator": "GPU", "widgets": { "application/vnd.jupyter.widget-state+json": { "5e5f6d0bae264cb492b6dda56e53e074": { "model_module": "@jupyter-widgets/controls", "model_name": "VBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "VBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "VBoxView", "box_style": "", "children": [], "layout": "IPY_MODEL_bddcd0e0941f488fbb0d98ac264cb72a" } }, "eebf76576b7b4b719ac57de36e66382b": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4e0e83a476a840fcb4c334efcd961a7a", "placeholder": "​", "style": "IPY_MODEL_a17b3df99ee941ad838e1ed455663f54", "value": "

Copy a token from your Hugging Face\ntokens page and paste it below.
Immediately click login after copying\nyour token or it might be stored in plain text in this notebook file.
" } }, "a1d0a8cf6fe54df887f65436d8935269": { "model_module": "@jupyter-widgets/controls", "model_name": "PasswordModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "PasswordModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "PasswordView", "continuous_update": true, "description": "Token:", "description_tooltip": null, "disabled": false, "layout": "IPY_MODEL_8e317e1fb21c46debc662b461e84c912", "placeholder": "​", "style": "IPY_MODEL_1c304f3e820e4b899f5349181570ed6e", "value": "" } }, "10366c39d49b4e6cb3d44166590352fc": { "model_module": "@jupyter-widgets/controls", "model_name": "CheckboxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "CheckboxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "CheckboxView", "description": "Add token as git credential?", "description_tooltip": null, "disabled": false, "indent": true, "layout": "IPY_MODEL_19ca5e456206449796b620ee5ec7f9fd", "style": "IPY_MODEL_0bed7d5da23c4fcbb2ef5e663ecfaeb6", "value": true } }, "145ed8fecddf49fe8f8f283d2d8ddab9": { "model_module": "@jupyter-widgets/controls", "model_name": "ButtonModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ButtonModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ButtonView", "button_style": "", "description": "Login", "disabled": false, "icon": "", "layout": "IPY_MODEL_861c2d5a72d34afab4e01ee72d6b23dc", "style": "IPY_MODEL_a25f6653fc0c4d599e16e8ad207e0884", "tooltip": "" } }, "96010313880644fa9b6293e41a150e5f": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bbcc61b64eed4d2ea96e679ed66675af", "placeholder": "​", "style": "IPY_MODEL_6f78af7746864b40a1531f35e0e3ac11", "value": "\nPro Tip: If you don't already have one, you can create a dedicated\n'notebooks' token with 'write' access, that you can then easily reuse for all\nnotebooks. " } }, "bddcd0e0941f488fbb0d98ac264cb72a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": "center", "align_self": null, "border": null, "bottom": null, "display": "flex", "flex": null, "flex_flow": "column", "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "50%" } }, "4e0e83a476a840fcb4c334efcd961a7a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a17b3df99ee941ad838e1ed455663f54": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "8e317e1fb21c46debc662b461e84c912": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "1c304f3e820e4b899f5349181570ed6e": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "19ca5e456206449796b620ee5ec7f9fd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "0bed7d5da23c4fcbb2ef5e663ecfaeb6": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "861c2d5a72d34afab4e01ee72d6b23dc": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a25f6653fc0c4d599e16e8ad207e0884": { "model_module": "@jupyter-widgets/controls", "model_name": "ButtonStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ButtonStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "button_color": null, "font_weight": "" } }, "bbcc61b64eed4d2ea96e679ed66675af": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "6f78af7746864b40a1531f35e0e3ac11": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "bad0550de5fc4c46acbae99e23dc164a": { "model_module": "@jupyter-widgets/controls", "model_name": "LabelModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "LabelModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "LabelView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3df1ff9d97f141b0920407e52c698947", "placeholder": "​", "style": "IPY_MODEL_3e5cea3b91364b98bc36cb0e7c257043", "value": "Connecting..." } }, "3df1ff9d97f141b0920407e52c698947": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3e5cea3b91364b98bc36cb0e7c257043": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "5020bf1e1c204e39ab31f056b3600741": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_d95cab9089d44bc6b5d52b0d76f1a46a", "IPY_MODEL_acb45e0fccbf4f69a16ad2cd49164f6b", "IPY_MODEL_32d3fe4e127e4df7a6b8fc9dac232f25" ], "layout": "IPY_MODEL_4a007e2d509b4680af0f604307c52f3e" } }, "d95cab9089d44bc6b5d52b0d76f1a46a": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2d254d56520d4b918502fd16da289203", "placeholder": "​", "style": "IPY_MODEL_d5b08bebdfc94ded9fd423d6fd9d94ef", "value": "pytorch_variables.pth: 100%" } }, "acb45e0fccbf4f69a16ad2cd49164f6b": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_aac0fec03e9e4b44a9f8deffdb4d7f93", "max": 864, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_d95b3e2d64c747e0b935b027a4e88c06", "value": 864 } }, "32d3fe4e127e4df7a6b8fc9dac232f25": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dccab72235324e33b70c19e9c588dad1", "placeholder": "​", "style": "IPY_MODEL_207406a8df3944b2b96b58c141e2aca3", "value": " 864/864 [00:00<00:00, 4.04kB/s]" } }, "4a007e2d509b4680af0f604307c52f3e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2d254d56520d4b918502fd16da289203": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d5b08bebdfc94ded9fd423d6fd9d94ef": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "aac0fec03e9e4b44a9f8deffdb4d7f93": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d95b3e2d64c747e0b935b027a4e88c06": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "dccab72235324e33b70c19e9c588dad1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "207406a8df3944b2b96b58c141e2aca3": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "c91927a907374adea725820bb00e91ae": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_2eabca278c93495f80b9271cc390560b", "IPY_MODEL_56e518d75ba046e4a3820b476f17462b", "IPY_MODEL_9b9271c2afbf450aaf9f4095f3412bed" ], "layout": "IPY_MODEL_f873d40665304447ac1e98d56ff5f3d6" } }, "2eabca278c93495f80b9271cc390560b": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_47aeca0a5e954de499b19405b79b25a1", "placeholder": "​", "style": "IPY_MODEL_08399c618acd4cba93743b29aed2dcd0", "value": "Upload 5 LFS files: 100%" } }, "56e518d75ba046e4a3820b476f17462b": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ffb3d541d4b34059a88cb8d1c962f5da", "max": 5, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_bf7bf33bc3e24c7b98e78ec284a5ab3a", "value": 5 } }, "9b9271c2afbf450aaf9f4095f3412bed": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2aac7ba4f39c436abb63da4083ef33ef", "placeholder": "​", "style": "IPY_MODEL_71b3d9eccf2d40e48d9a4a7f07fceb1b", "value": " 5/5 [00:00<00:00,  1.72it/s]" } }, "f873d40665304447ac1e98d56ff5f3d6": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "47aeca0a5e954de499b19405b79b25a1": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "08399c618acd4cba93743b29aed2dcd0": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "ffb3d541d4b34059a88cb8d1c962f5da": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bf7bf33bc3e24c7b98e78ec284a5ab3a": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "2aac7ba4f39c436abb63da4083ef33ef": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "71b3d9eccf2d40e48d9a4a7f07fceb1b": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "a6142dc28afa4dce9095f229dffabef0": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_10e1153970744479b3fd2426feb82fe1", "IPY_MODEL_b93a90d2a3554dbcb4c556c9c5c11ce2", "IPY_MODEL_03294e9be55a4772ae7f8e01910293c7" ], "layout": "IPY_MODEL_eac4c65316094066815d7240021e9ef3" } }, "10e1153970744479b3fd2426feb82fe1": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a7d2d6e93bde42fdb7412cd3b97b31fc", "placeholder": "​", "style": "IPY_MODEL_f7b21bb1ce714f8cbcefc46bf1c15aa8", "value": "policy.pth: 100%" } }, "b93a90d2a3554dbcb4c556c9c5c11ce2": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4400895276c340e89b2fbf42ba49d2dd", "max": 43762, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_30fc2f7a990d4e8b9c40ab184cedad40", "value": 43762 } }, "03294e9be55a4772ae7f8e01910293c7": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_bedb633c81294c108fdd3cb4e0be420f", "placeholder": "​", "style": "IPY_MODEL_528a81331da44e1c8db2813f3798e26b", "value": " 43.8k/43.8k [00:00<00:00, 143kB/s]" } }, "eac4c65316094066815d7240021e9ef3": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a7d2d6e93bde42fdb7412cd3b97b31fc": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "f7b21bb1ce714f8cbcefc46bf1c15aa8": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "4400895276c340e89b2fbf42ba49d2dd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "30fc2f7a990d4e8b9c40ab184cedad40": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "bedb633c81294c108fdd3cb4e0be420f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "528a81331da44e1c8db2813f3798e26b": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "0e14da22c3d04dd4bc40b562451a8b19": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_40347b991af944c39d9ed612ebd9acb2", "IPY_MODEL_f1cf5da591c94b05bab9ad739f6856b4", "IPY_MODEL_7e7f04611a3b4206ac8ca419cb5d96a2" ], "layout": "IPY_MODEL_50cf39c800124d259a6295f63a43ee97" } }, "40347b991af944c39d9ed612ebd9acb2": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_704f6edda2284d599e70514be3148bdb", "placeholder": "​", "style": "IPY_MODEL_acafb84f9ee54157a58598516fd6fe7d", "value": "policy.optimizer.pth: 100%" } }, "f1cf5da591c94b05bab9ad739f6856b4": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a985ac83e6f84d6f86aabc107aa2516e", "max": 88362, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_a5995786c1e0411cba8cd1e7f550cc15", "value": 88362 } }, "7e7f04611a3b4206ac8ca419cb5d96a2": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_05ebf165c08144cfaf8f67ed4830f515", "placeholder": "​", "style": "IPY_MODEL_ecfecaf9db4a467097db9030e0b3b7ed", "value": " 88.4k/88.4k [00:00<00:00, 138kB/s]" } }, "50cf39c800124d259a6295f63a43ee97": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "704f6edda2284d599e70514be3148bdb": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "acafb84f9ee54157a58598516fd6fe7d": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "a985ac83e6f84d6f86aabc107aa2516e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a5995786c1e0411cba8cd1e7f550cc15": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "05ebf165c08144cfaf8f67ed4830f515": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ecfecaf9db4a467097db9030e0b3b7ed": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "19c5ab8146724dfbb027890c2ea2cf94": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_2875ccb651f440ef934ce1cb23543d93", "IPY_MODEL_b69d2dae1d9446cbabc5407d0ac5e980", "IPY_MODEL_623a4e087d29487ca5c7cf4347e8acce" ], "layout": "IPY_MODEL_ef57d76ccb2e4491a989a9b65c4b5805" } }, "2875ccb651f440ef934ce1cb23543d93": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_790b36d1910848ddbbc52269041a29e0", "placeholder": "​", "style": "IPY_MODEL_19af9a202ae24064ad33778aa8484214", "value": "ppo-LunarLander-v2.zip: 100%" } }, "b69d2dae1d9446cbabc5407d0ac5e980": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_eed1d3020cbd4107971fb729b9976290", "max": 147446, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_ec75022e31e84c1aa600d5cb3b63a988", "value": 147446 } }, "623a4e087d29487ca5c7cf4347e8acce": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_396f31725b554bfcbe7306457081098c", "placeholder": "​", "style": "IPY_MODEL_d84c2fc0f879448d80b147ffa51027a0", "value": " 147k/147k [00:00<00:00, 409kB/s]" } }, "ef57d76ccb2e4491a989a9b65c4b5805": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "790b36d1910848ddbbc52269041a29e0": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "19af9a202ae24064ad33778aa8484214": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "eed1d3020cbd4107971fb729b9976290": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ec75022e31e84c1aa600d5cb3b63a988": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "396f31725b554bfcbe7306457081098c": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d84c2fc0f879448d80b147ffa51027a0": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "4b7088e4bed9484d8cdd5351a2b5c41c": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_01604361dfb944b4832b84801a7d31e6", "IPY_MODEL_a6e5554de16246b2aa3537e29dbd71df", "IPY_MODEL_e4ccc6f1a58d446e85ffacb3231c0356" ], "layout": "IPY_MODEL_73dc03c3ff3e481f8394ea7c287f92be" } }, "01604361dfb944b4832b84801a7d31e6": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ef31b8315d484a82b0af3900f4be78f9", "placeholder": "​", "style": "IPY_MODEL_4de6eaed1dc44babbb0404c84c5f1eca", "value": "replay.mp4: 100%" } }, "a6e5554de16246b2aa3537e29dbd71df": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ebd4b0a6dc4d4f0d8f50a3983d294e4b", "max": 146181, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_ba80504ccda94041be1526348e9986dd", "value": 146181 } }, "e4ccc6f1a58d446e85ffacb3231c0356": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_5281d7c2987b47e0b94f96eee4f69cb6", "placeholder": "​", "style": "IPY_MODEL_6a5eafa9b02a4a9abc40a52f35a5a1db", "value": " 146k/146k [00:00<00:00, 363kB/s]" } }, "73dc03c3ff3e481f8394ea7c287f92be": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ef31b8315d484a82b0af3900f4be78f9": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "4de6eaed1dc44babbb0404c84c5f1eca": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "ebd4b0a6dc4d4f0d8f50a3983d294e4b": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ba80504ccda94041be1526348e9986dd": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "5281d7c2987b47e0b94f96eee4f69cb6": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "6a5eafa9b02a4a9abc40a52f35a5a1db": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "code", "execution_count": 8, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "HPgTjD1qhN05", "outputId": "8eb7426a-0e16-400b-f2bf-d97f19728da8" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Reading package lists... Done\n", "Building dependency tree... Done\n", "Reading state information... Done\n", "swig is already the newest version (4.0.2-1ubuntu1).\n", "cmake is already the newest version (3.22.1-1ubuntu1.22.04.2).\n", "0 upgraded, 0 newly installed, 0 to remove and 47 not upgraded.\n" ] } ], "source": [ "!apt install swig cmake" ] }, { "cell_type": "code", "source": [ "!pip install -r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "Vlp7EePAh1px", "outputId": "16f3b2f7-feea-4c58-9d25-33825952662c" }, "execution_count": 9, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Requirement already satisfied: stable-baselines3==2.0.0a5 in /usr/local/lib/python3.11/dist-packages (from -r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2.0.0a5)\n", "Requirement already satisfied: swig in /usr/local/lib/python3.11/dist-packages (from -r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 2)) (4.3.1)\n", "Requirement already satisfied: huggingface_sb3 in /usr/local/lib/python3.11/dist-packages (from -r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (3.0)\n", "Requirement already satisfied: gymnasium[box2d] in /usr/local/lib/python3.11/dist-packages (from -r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 3)) (0.28.1)\n", "Requirement already satisfied: numpy in /usr/local/lib/python3.11/dist-packages (from stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2.0.2)\n", "Requirement already satisfied: torch>=1.11 in /usr/local/lib/python3.11/dist-packages (from stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2.6.0+cu124)\n", "Requirement already satisfied: cloudpickle in /usr/local/lib/python3.11/dist-packages (from stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.1.1)\n", "Requirement already satisfied: pandas in /usr/local/lib/python3.11/dist-packages (from stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2.2.2)\n", "Requirement already satisfied: matplotlib in /usr/local/lib/python3.11/dist-packages (from stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.10.0)\n", "Requirement already satisfied: jax-jumpy>=1.0.0 in /usr/local/lib/python3.11/dist-packages (from gymnasium[box2d]->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 3)) (1.0.0)\n", "Requirement already satisfied: typing-extensions>=4.3.0 in /usr/local/lib/python3.11/dist-packages (from gymnasium[box2d]->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 3)) (4.13.2)\n", "Requirement already satisfied: farama-notifications>=0.0.1 in /usr/local/lib/python3.11/dist-packages (from gymnasium[box2d]->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 3)) (0.0.4)\n", "Requirement already satisfied: box2d-py==2.3.5 in /usr/local/lib/python3.11/dist-packages (from gymnasium[box2d]->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 3)) (2.3.5)\n", "Requirement already satisfied: pygame==2.1.3 in /usr/local/lib/python3.11/dist-packages (from gymnasium[box2d]->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 3)) (2.1.3)\n", "Requirement already satisfied: huggingface-hub~=0.8 in /usr/local/lib/python3.11/dist-packages (from huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (0.31.4)\n", "Requirement already satisfied: pyyaml~=6.0 in /usr/local/lib/python3.11/dist-packages (from huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (6.0.2)\n", "Requirement already satisfied: wasabi in /usr/local/lib/python3.11/dist-packages (from huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (1.1.3)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.11/dist-packages (from huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (3.18.0)\n", "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.11/dist-packages (from huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (2025.3.2)\n", "Requirement already satisfied: packaging>=20.9 in /usr/local/lib/python3.11/dist-packages (from huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (24.2)\n", "Requirement already satisfied: requests in /usr/local/lib/python3.11/dist-packages (from huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (2.32.3)\n", "Requirement already satisfied: tqdm>=4.42.1 in /usr/local/lib/python3.11/dist-packages (from huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (4.67.1)\n", "Requirement already satisfied: networkx in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.4.2)\n", "Requirement already satisfied: jinja2 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.1.6)\n", "Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.4.127 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.4.127)\n", "Requirement already satisfied: nvidia-cuda-runtime-cu12==12.4.127 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.4.127)\n", "Requirement already satisfied: nvidia-cuda-cupti-cu12==12.4.127 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.4.127)\n", "Requirement already satisfied: nvidia-cudnn-cu12==9.1.0.70 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (9.1.0.70)\n", "Requirement already satisfied: nvidia-cublas-cu12==12.4.5.8 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.4.5.8)\n", "Requirement already satisfied: nvidia-cufft-cu12==11.2.1.3 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (11.2.1.3)\n", "Requirement already satisfied: nvidia-curand-cu12==10.3.5.147 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (10.3.5.147)\n", "Requirement already satisfied: nvidia-cusolver-cu12==11.6.1.9 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (11.6.1.9)\n", "Requirement already satisfied: nvidia-cusparse-cu12==12.3.1.170 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.3.1.170)\n", "Requirement already satisfied: nvidia-cusparselt-cu12==0.6.2 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (0.6.2)\n", "Requirement already satisfied: nvidia-nccl-cu12==2.21.5 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2.21.5)\n", "Requirement already satisfied: nvidia-nvtx-cu12==12.4.127 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.4.127)\n", "Requirement already satisfied: nvidia-nvjitlink-cu12==12.4.127 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (12.4.127)\n", "Requirement already satisfied: triton==3.2.0 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.2.0)\n", "Requirement already satisfied: sympy==1.13.1 in /usr/local/lib/python3.11/dist-packages (from torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (1.13.1)\n", "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.11/dist-packages (from sympy==1.13.1->torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (1.3.0)\n", "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (1.3.2)\n", "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (0.12.1)\n", "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (4.58.0)\n", "Requirement already satisfied: kiwisolver>=1.3.1 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (1.4.8)\n", "Requirement already satisfied: pillow>=8 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (11.2.1)\n", "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.2.3)\n", "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.11/dist-packages (from matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2.9.0.post0)\n", "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.11/dist-packages (from pandas->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2025.2)\n", "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.11/dist-packages (from pandas->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (2025.2)\n", "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.11/dist-packages (from python-dateutil>=2.7->matplotlib->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (1.17.0)\n", "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.11/dist-packages (from jinja2->torch>=1.11->stable-baselines3==2.0.0a5->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 1)) (3.0.2)\n", "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.11/dist-packages (from requests->huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (3.4.2)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.11/dist-packages (from requests->huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (3.10)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.11/dist-packages (from requests->huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (2.4.0)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.11/dist-packages (from requests->huggingface-hub~=0.8->huggingface_sb3->-r https://raw.githubusercontent.com/huggingface/deep-rl-class/main/notebooks/unit1/requirements-unit1.txt (line 4)) (2025.4.26)\n" ] } ] }, { "cell_type": "code", "source": [ "!sudo apt-get update\n", "!sudo apt-get install -y python3-opengl\n", "!apt install ffmpeg\n", "!apt install xvfb\n", "!pip3 install pyvirtualdisplay" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "iKHH3oY2iEHg", "outputId": "7ed4efd7-2ce0-4fdb-ca81-679158e33cfc" }, "execution_count": 10, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\r0% [Working]\r \rHit:1 https://cloud.r-project.org/bin/linux/ubuntu jammy-cran40/ InRelease\n", "\r0% [Waiting for headers] [Connecting to security.ubuntu.com (185.125.190.82)] [\r \rHit:2 https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64 InRelease\n", "Hit:3 http://archive.ubuntu.com/ubuntu jammy InRelease\n", "Hit:4 http://archive.ubuntu.com/ubuntu jammy-updates InRelease\n", "Hit:5 http://security.ubuntu.com/ubuntu jammy-security InRelease\n", "Hit:6 http://archive.ubuntu.com/ubuntu jammy-backports InRelease\n", "Hit:7 https://r2u.stat.illinois.edu/ubuntu jammy InRelease\n", "Hit:8 https://ppa.launchpadcontent.net/deadsnakes/ppa/ubuntu jammy InRelease\n", "Hit:9 https://ppa.launchpadcontent.net/graphics-drivers/ppa/ubuntu jammy InRelease\n", "Hit:10 https://ppa.launchpadcontent.net/ubuntugis/ppa/ubuntu jammy InRelease\n", "Reading package lists... Done\n", "W: Skipping acquire of configured file 'main/source/Sources' as repository 'https://r2u.stat.illinois.edu/ubuntu jammy InRelease' does not seem to provide it (sources.list entry misspelt?)\n", "Reading package lists... Done\n", "Building dependency tree... Done\n", "Reading state information... Done\n", "python3-opengl is already the newest version (3.1.5+dfsg-1).\n", "0 upgraded, 0 newly installed, 0 to remove and 47 not upgraded.\n", "Reading package lists... Done\n", "Building dependency tree... Done\n", "Reading state information... Done\n", "ffmpeg is already the newest version (7:4.4.2-0ubuntu0.22.04.1).\n", "0 upgraded, 0 newly installed, 0 to remove and 47 not upgraded.\n", "Reading package lists... Done\n", "Building dependency tree... Done\n", "Reading state information... Done\n", "xvfb is already the newest version (2:21.1.4-2ubuntu1.7~22.04.14).\n", "0 upgraded, 0 newly installed, 0 to remove and 47 not upgraded.\n", "Requirement already satisfied: pyvirtualdisplay in /usr/local/lib/python3.11/dist-packages (3.0)\n" ] } ] }, { "cell_type": "code", "source": [ "import os\n", "os.kill(os.getpid(), 9)" ], "metadata": { "id": "vJLiOmhiiRqe" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "# Virtual display\n", "from pyvirtualdisplay import Display\n", "\n", "virtual_display = Display(visible=0, size=(1400, 900))\n", "virtual_display.start()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "mkLXf2u1iVII", "outputId": "6bb6272d-b71c-42ba-cdb9-30d5c8a76f20" }, "execution_count": 1, "outputs": [ { "output_type": "execute_result", "data": { "text/plain": [ "" ] }, "metadata": {}, "execution_count": 1 } ] }, { "cell_type": "code", "source": [ "import gymnasium\n", "\n", "from huggingface_sb3 import load_from_hub, package_to_hub\n", "from huggingface_hub import notebook_login # To log to our Hugging Face account to be able to upload models to the Hub.\n", "\n", "from stable_baselines3 import PPO\n", "from stable_baselines3.common.env_util import make_vec_env\n", "from stable_baselines3.common.evaluation import evaluate_policy\n", "from stable_baselines3.common.monitor import Monitor" ], "metadata": { "id": "epcO9X2Aijmd" }, "execution_count": 2, "outputs": [] }, { "cell_type": "code", "source": [ "import gymnasium as gym\n", "\n", "# First, we create our environment called LunarLander-v2\n", "env = gym.make(\"LunarLander-v2\")\n", "\n", "# Then we reset this environment\n", "observation, info = env.reset()\n", "\n", "for _ in range(20):\n", " # Take a random action\n", " action = env.action_space.sample()\n", " print(\"Action taken:\", action)\n", "\n", " # Do this action in the environment and get\n", " # next_state, reward, terminated, truncated and info\n", " observation, reward, terminated, truncated, info = env.step(action)\n", "\n", " # If the game is terminated (in our case we land, crashed) or truncated (timeout)\n", " if terminated or truncated:\n", " # Reset the environment\n", " print(\"Environment is reset\")\n", " observation, info = env.reset()\n", "\n", "env.close()" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "duphyUfajB_Y", "outputId": "c9970f58-6bac-4c17-a6ae-3d309abb59fc" }, "execution_count": 3, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Action taken: 3\n", "Action taken: 2\n", "Action taken: 0\n", "Action taken: 2\n", "Action taken: 0\n", "Action taken: 2\n", "Action taken: 1\n", "Action taken: 1\n", "Action taken: 0\n", "Action taken: 0\n", "Action taken: 1\n", "Action taken: 2\n", "Action taken: 0\n", "Action taken: 2\n", "Action taken: 3\n", "Action taken: 3\n", "Action taken: 0\n", "Action taken: 2\n", "Action taken: 2\n", "Action taken: 0\n" ] } ] }, { "cell_type": "code", "source": [ "# We create our environment with gym.make(\"\")\n", "env = gym.make(\"LunarLander-v2\")\n", "env.reset()\n", "print(\"_____OBSERVATION SPACE_____ \\n\")\n", "print(\"Observation Space Shape\", env.observation_space.shape)\n", "print(\"Sample observation\", env.observation_space.sample()) # Get a random observation" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "XDsGJRCBjNb4", "outputId": "35c1d729-e6ff-472d-d8f6-bb5f41bedc51" }, "execution_count": 4, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "_____OBSERVATION SPACE_____ \n", "\n", "Observation Space Shape (8,)\n", "Sample observation [ 2.3788338 -46.57826 -0.81979173 1.1026646 2.1140828\n", " 0.71973133 0.6722164 0.25126696]\n" ] } ] }, { "cell_type": "code", "source": [ "print(\"\\n _____ACTION SPACE_____ \\n\")\n", "print(\"Action Space Shape\", env.action_space.n)\n", "print(\"Action Space Sample\", env.action_space.sample()) # Take a random action" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "SEPFCtEcjXEt", "outputId": "0d16eca3-2d85-4677-ef14-8b4b81b107a5" }, "execution_count": 5, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\n", " _____ACTION SPACE_____ \n", "\n", "Action Space Shape 4\n", "Action Space Sample 1\n" ] } ] }, { "cell_type": "code", "source": [ "# Create the environment\n", "env = make_vec_env('LunarLander-v2', n_envs=16)" ], "metadata": { "id": "H9D4RSNbjiOI" }, "execution_count": 6, "outputs": [] }, { "cell_type": "code", "source": [ "# Create environment\n", "env = gym.make('LunarLander-v2')\n", "\n", "model = PPO(\n", " policy = 'MlpPolicy',\n", " env = env,\n", " n_steps = 1024,\n", " batch_size = 64,\n", " n_epochs = 4,\n", " gamma = 0.999,\n", " gae_lambda = 0.98,\n", " ent_coef = 0.01,\n", " verbose=1)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "BDM864ltj0xF", "outputId": "f20febbc-fad1-4017-e53c-4d8f72c36ecc" }, "execution_count": 7, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Using cuda device\n", "Wrapping the env with a `Monitor` wrapper\n", "Wrapping the env in a DummyVecEnv.\n" ] } ] }, { "cell_type": "code", "source": [ "# Train the agent\n", "model.learn(total_timesteps=int(1e6))\n", "model_name = \"ppo-LunarLander-v2\"\n", "model.save(model_name)" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "hGEWL_bIknO1", "outputId": "a1943411-4319-4840-c57a-206041873d6c" }, "execution_count": 8, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\u001b[1;30;43mStreaming output truncated to the last 5000 lines.\u001b[0m\n", "| value_loss | 395 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 577 |\n", "| ep_rew_mean | 185 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 740 |\n", "| time_elapsed | 1323 |\n", "| total_timesteps | 757760 |\n", "| train/ | |\n", "| approx_kl | 0.0042034434 |\n", "| clip_fraction | 0.0144 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.687 |\n", "| explained_variance | 0.97417665 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.09 |\n", "| n_updates | 2956 |\n", "| policy_gradient_loss | -0.000941 |\n", "| value_loss | 15.8 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 567 |\n", "| ep_rew_mean | 184 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 741 |\n", "| time_elapsed | 1324 |\n", "| total_timesteps | 758784 |\n", "| train/ | |\n", "| approx_kl | 0.0027432581 |\n", "| clip_fraction | 0.0061 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.772 |\n", "| explained_variance | 0.5152496 |\n", "| learning_rate | 0.0003 |\n", "| loss | 482 |\n", "| n_updates | 2960 |\n", "| policy_gradient_loss | -0.00334 |\n", "| value_loss | 708 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 561 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 742 |\n", "| time_elapsed | 1326 |\n", "| total_timesteps | 759808 |\n", "| train/ | |\n", "| approx_kl | 0.00011096685 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.856 |\n", "| explained_variance | 0.4959107 |\n", "| learning_rate | 0.0003 |\n", "| loss | 715 |\n", "| n_updates | 2964 |\n", "| policy_gradient_loss | -0.000158 |\n", "| value_loss | 1.58e+03 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 559 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 743 |\n", "| time_elapsed | 1328 |\n", "| total_timesteps | 760832 |\n", "| train/ | |\n", "| approx_kl | 2.2239343e-05 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.831 |\n", "| explained_variance | 0.6606667 |\n", "| learning_rate | 0.0003 |\n", "| loss | 766 |\n", "| n_updates | 2968 |\n", "| policy_gradient_loss | -0.000103 |\n", "| value_loss | 1.08e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 553 |\n", "| ep_rew_mean | 180 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 744 |\n", "| time_elapsed | 1330 |\n", "| total_timesteps | 761856 |\n", "| train/ | |\n", "| approx_kl | 0.0006124177 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.807 |\n", "| explained_variance | 0.77966523 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.34 |\n", "| n_updates | 2972 |\n", "| policy_gradient_loss | -0.000191 |\n", "| value_loss | 77.9 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 551 |\n", "| ep_rew_mean | 180 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 745 |\n", "| time_elapsed | 1331 |\n", "| total_timesteps | 762880 |\n", "| train/ | |\n", "| approx_kl | 0.00014669175 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.829 |\n", "| explained_variance | 0.65267545 |\n", "| learning_rate | 0.0003 |\n", "| loss | 121 |\n", "| n_updates | 2976 |\n", "| policy_gradient_loss | -0.000391 |\n", "| value_loss | 556 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 556 |\n", "| ep_rew_mean | 179 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 746 |\n", "| time_elapsed | 1333 |\n", "| total_timesteps | 763904 |\n", "| train/ | |\n", "| approx_kl | 0.006000284 |\n", "| clip_fraction | 0.0176 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.661 |\n", "| explained_variance | 0.71720904 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.32 |\n", "| n_updates | 2980 |\n", "| policy_gradient_loss | -0.00252 |\n", "| value_loss | 54.1 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 548 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 747 |\n", "| time_elapsed | 1335 |\n", "| total_timesteps | 764928 |\n", "| train/ | |\n", "| approx_kl | 0.0036223517 |\n", "| clip_fraction | 0.0225 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.655 |\n", "| explained_variance | 0.9865678 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.21 |\n", "| n_updates | 2984 |\n", "| policy_gradient_loss | -0.00173 |\n", "| value_loss | 9.54 |\n", "------------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 535 |\n", "| ep_rew_mean | 183 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 748 |\n", "| time_elapsed | 1337 |\n", "| total_timesteps | 765952 |\n", "| train/ | |\n", "| approx_kl | 0.00528423 |\n", "| clip_fraction | 0.0374 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.833 |\n", "| explained_variance | 0.8088507 |\n", "| learning_rate | 0.0003 |\n", "| loss | 33.9 |\n", "| n_updates | 2988 |\n", "| policy_gradient_loss | -0.00162 |\n", "| value_loss | 86.5 |\n", "----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 535 |\n", "| ep_rew_mean | 183 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 749 |\n", "| time_elapsed | 1339 |\n", "| total_timesteps | 766976 |\n", "| train/ | |\n", "| approx_kl | 0.0035410176 |\n", "| clip_fraction | 0.0198 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.741 |\n", "| explained_variance | 0.950471 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.26 |\n", "| n_updates | 2992 |\n", "| policy_gradient_loss | -0.00339 |\n", "| value_loss | 18.3 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 535 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 750 |\n", "| time_elapsed | 1340 |\n", "| total_timesteps | 768000 |\n", "| train/ | |\n", "| approx_kl | 0.00059015595 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.766 |\n", "| explained_variance | 0.48042 |\n", "| learning_rate | 0.0003 |\n", "| loss | 132 |\n", "| n_updates | 2996 |\n", "| policy_gradient_loss | 0.000369 |\n", "| value_loss | 958 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 524 |\n", "| ep_rew_mean | 180 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 751 |\n", "| time_elapsed | 1342 |\n", "| total_timesteps | 769024 |\n", "| train/ | |\n", "| approx_kl | 0.004074127 |\n", "| clip_fraction | 0.0312 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.635 |\n", "| explained_variance | 0.9521401 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.16 |\n", "| n_updates | 3000 |\n", "| policy_gradient_loss | -0.00385 |\n", "| value_loss | 41.9 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 512 |\n", "| ep_rew_mean | 183 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 752 |\n", "| time_elapsed | 1344 |\n", "| total_timesteps | 770048 |\n", "| train/ | |\n", "| approx_kl | 0.00014795299 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.804 |\n", "| explained_variance | 0.20598006 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.23e+03 |\n", "| n_updates | 3004 |\n", "| policy_gradient_loss | 0.000138 |\n", "| value_loss | 1.72e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 506 |\n", "| ep_rew_mean | 184 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 753 |\n", "| time_elapsed | 1346 |\n", "| total_timesteps | 771072 |\n", "| train/ | |\n", "| approx_kl | 0.0033478313 |\n", "| clip_fraction | 0.0125 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.788 |\n", "| explained_variance | 0.93252504 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.2 |\n", "| n_updates | 3008 |\n", "| policy_gradient_loss | -0.00162 |\n", "| value_loss | 56.6 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 497 |\n", "| ep_rew_mean | 186 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 754 |\n", "| time_elapsed | 1348 |\n", "| total_timesteps | 772096 |\n", "| train/ | |\n", "| approx_kl | 0.0016964914 |\n", "| clip_fraction | 0.00513 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.725 |\n", "| explained_variance | 0.9674633 |\n", "| learning_rate | 0.0003 |\n", "| loss | 33.1 |\n", "| n_updates | 3012 |\n", "| policy_gradient_loss | -0.000742 |\n", "| value_loss | 56.2 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 489 |\n", "| ep_rew_mean | 187 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 755 |\n", "| time_elapsed | 1349 |\n", "| total_timesteps | 773120 |\n", "| train/ | |\n", "| approx_kl | 8.0496655e-05 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.838 |\n", "| explained_variance | 0.5931463 |\n", "| learning_rate | 0.0003 |\n", "| loss | 151 |\n", "| n_updates | 3016 |\n", "| policy_gradient_loss | -0.00022 |\n", "| value_loss | 670 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 476 |\n", "| ep_rew_mean | 184 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 756 |\n", "| time_elapsed | 1351 |\n", "| total_timesteps | 774144 |\n", "| train/ | |\n", "| approx_kl | 0.00081147073 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.815 |\n", "| explained_variance | 0.61604786 |\n", "| learning_rate | 0.0003 |\n", "| loss | 28.3 |\n", "| n_updates | 3020 |\n", "| policy_gradient_loss | -0.000535 |\n", "| value_loss | 124 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 469 |\n", "| ep_rew_mean | 184 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 757 |\n", "| time_elapsed | 1353 |\n", "| total_timesteps | 775168 |\n", "| train/ | |\n", "| approx_kl | 0.00034849357 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.83 |\n", "| explained_variance | 0.4269191 |\n", "| learning_rate | 0.0003 |\n", "| loss | 597 |\n", "| n_updates | 3024 |\n", "| policy_gradient_loss | -0.000289 |\n", "| value_loss | 1.09e+03 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 471 |\n", "| ep_rew_mean | 184 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 758 |\n", "| time_elapsed | 1354 |\n", "| total_timesteps | 776192 |\n", "| train/ | |\n", "| approx_kl | 0.00088153535 |\n", "| clip_fraction | 0.00195 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.695 |\n", "| explained_variance | 0.9697084 |\n", "| learning_rate | 0.0003 |\n", "| loss | 26.4 |\n", "| n_updates | 3028 |\n", "| policy_gradient_loss | -0.00171 |\n", "| value_loss | 46.8 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 477 |\n", "| ep_rew_mean | 183 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 759 |\n", "| time_elapsed | 1356 |\n", "| total_timesteps | 777216 |\n", "| train/ | |\n", "| approx_kl | 0.0002514213 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.747 |\n", "| explained_variance | 0.55965495 |\n", "| learning_rate | 0.0003 |\n", "| loss | 546 |\n", "| n_updates | 3032 |\n", "| policy_gradient_loss | -0.0004 |\n", "| value_loss | 1.1e+03 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 477 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 760 |\n", "| time_elapsed | 1358 |\n", "| total_timesteps | 778240 |\n", "| train/ | |\n", "| approx_kl | 0.0040037315 |\n", "| clip_fraction | 0.0178 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.53 |\n", "| explained_variance | 0.97577226 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.64 |\n", "| n_updates | 3036 |\n", "| policy_gradient_loss | -0.00127 |\n", "| value_loss | 7.63 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 475 |\n", "| ep_rew_mean | 186 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 761 |\n", "| time_elapsed | 1360 |\n", "| total_timesteps | 779264 |\n", "| train/ | |\n", "| approx_kl | 0.006242698 |\n", "| clip_fraction | 0.0227 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.845 |\n", "| explained_variance | 0.8915558 |\n", "| learning_rate | 0.0003 |\n", "| loss | 17.5 |\n", "| n_updates | 3040 |\n", "| policy_gradient_loss | -0.00198 |\n", "| value_loss | 56.6 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 474 |\n", "| ep_rew_mean | 186 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 762 |\n", "| time_elapsed | 1362 |\n", "| total_timesteps | 780288 |\n", "| train/ | |\n", "| approx_kl | 0.0076142084 |\n", "| clip_fraction | 0.0393 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.682 |\n", "| explained_variance | 0.9681996 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.9 |\n", "| n_updates | 3044 |\n", "| policy_gradient_loss | -0.000216 |\n", "| value_loss | 23.2 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 480 |\n", "| ep_rew_mean | 188 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 763 |\n", "| time_elapsed | 1363 |\n", "| total_timesteps | 781312 |\n", "| train/ | |\n", "| approx_kl | 0.0006723335 |\n", "| clip_fraction | 0.00146 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.81 |\n", "| explained_variance | 0.47269958 |\n", "| learning_rate | 0.0003 |\n", "| loss | 152 |\n", "| n_updates | 3048 |\n", "| policy_gradient_loss | -0.000821 |\n", "| value_loss | 715 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 481 |\n", "| ep_rew_mean | 190 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 764 |\n", "| time_elapsed | 1365 |\n", "| total_timesteps | 782336 |\n", "| train/ | |\n", "| approx_kl | 0.008285914 |\n", "| clip_fraction | 0.0356 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.713 |\n", "| explained_variance | 0.9687481 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.03 |\n", "| n_updates | 3052 |\n", "| policy_gradient_loss | -0.00237 |\n", "| value_loss | 12.2 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 485 |\n", "| ep_rew_mean | 192 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 765 |\n", "| time_elapsed | 1367 |\n", "| total_timesteps | 783360 |\n", "| train/ | |\n", "| approx_kl | 0.0024471045 |\n", "| clip_fraction | 0.022 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.752 |\n", "| explained_variance | 0.9126106 |\n", "| learning_rate | 0.0003 |\n", "| loss | 21.6 |\n", "| n_updates | 3056 |\n", "| policy_gradient_loss | 0.00573 |\n", "| value_loss | 76.6 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 487 |\n", "| ep_rew_mean | 192 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 766 |\n", "| time_elapsed | 1368 |\n", "| total_timesteps | 784384 |\n", "| train/ | |\n", "| approx_kl | 0.006487619 |\n", "| clip_fraction | 0.0339 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.784 |\n", "| explained_variance | 0.9855715 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.65 |\n", "| n_updates | 3060 |\n", "| policy_gradient_loss | -0.000587 |\n", "| value_loss | 13.4 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 487 |\n", "| ep_rew_mean | 192 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 767 |\n", "| time_elapsed | 1371 |\n", "| total_timesteps | 785408 |\n", "| train/ | |\n", "| approx_kl | 0.0028090219 |\n", "| clip_fraction | 0.00757 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.737 |\n", "| explained_variance | 0.5472819 |\n", "| learning_rate | 0.0003 |\n", "| loss | 299 |\n", "| n_updates | 3064 |\n", "| policy_gradient_loss | 0.000455 |\n", "| value_loss | 727 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 480 |\n", "| ep_rew_mean | 193 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 768 |\n", "| time_elapsed | 1372 |\n", "| total_timesteps | 786432 |\n", "| train/ | |\n", "| approx_kl | 0.0032782308 |\n", "| clip_fraction | 0.0156 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.724 |\n", "| explained_variance | 0.9482073 |\n", "| learning_rate | 0.0003 |\n", "| loss | 18.6 |\n", "| n_updates | 3068 |\n", "| policy_gradient_loss | -0.00089 |\n", "| value_loss | 32.2 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 483 |\n", "| ep_rew_mean | 194 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 769 |\n", "| time_elapsed | 1374 |\n", "| total_timesteps | 787456 |\n", "| train/ | |\n", "| approx_kl | 0.0020764142 |\n", "| clip_fraction | 0.00244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.772 |\n", "| explained_variance | 0.8550257 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.56 |\n", "| n_updates | 3072 |\n", "| policy_gradient_loss | -0.00175 |\n", "| value_loss | 54.1 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 473 |\n", "| ep_rew_mean | 192 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 770 |\n", "| time_elapsed | 1376 |\n", "| total_timesteps | 788480 |\n", "| train/ | |\n", "| approx_kl | 0.0033340114 |\n", "| clip_fraction | 0.0181 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.65 |\n", "| explained_variance | 0.9382707 |\n", "| learning_rate | 0.0003 |\n", "| loss | 10.7 |\n", "| n_updates | 3076 |\n", "| policy_gradient_loss | -0.00228 |\n", "| value_loss | 27.3 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 193 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 771 |\n", "| time_elapsed | 1377 |\n", "| total_timesteps | 789504 |\n", "| train/ | |\n", "| approx_kl | 0.00042752596 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.749 |\n", "| explained_variance | 0.5673845 |\n", "| learning_rate | 0.0003 |\n", "| loss | 453 |\n", "| n_updates | 3080 |\n", "| policy_gradient_loss | 0.000286 |\n", "| value_loss | 687 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 193 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 772 |\n", "| time_elapsed | 1379 |\n", "| total_timesteps | 790528 |\n", "| train/ | |\n", "| approx_kl | 0.0015281553 |\n", "| clip_fraction | 0.00244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.794 |\n", "| explained_variance | 0.82194614 |\n", "| learning_rate | 0.0003 |\n", "| loss | 25.1 |\n", "| n_updates | 3084 |\n", "| policy_gradient_loss | -0.000521 |\n", "| value_loss | 91.4 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 469 |\n", "| ep_rew_mean | 194 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 773 |\n", "| time_elapsed | 1381 |\n", "| total_timesteps | 791552 |\n", "| train/ | |\n", "| approx_kl | 0.0030053323 |\n", "| clip_fraction | 0.0198 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.717 |\n", "| explained_variance | 0.93970346 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.59 |\n", "| n_updates | 3088 |\n", "| policy_gradient_loss | -0.00328 |\n", "| value_loss | 22.3 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 195 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 774 |\n", "| time_elapsed | 1383 |\n", "| total_timesteps | 792576 |\n", "| train/ | |\n", "| approx_kl | 0.0025847415 |\n", "| clip_fraction | 0.0105 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.719 |\n", "| explained_variance | 0.9400718 |\n", "| learning_rate | 0.0003 |\n", "| loss | 8.56 |\n", "| n_updates | 3092 |\n", "| policy_gradient_loss | -0.00223 |\n", "| value_loss | 29.3 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 194 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 775 |\n", "| time_elapsed | 1385 |\n", "| total_timesteps | 793600 |\n", "| train/ | |\n", "| approx_kl | 0.005926219 |\n", "| clip_fraction | 0.0417 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.744 |\n", "| explained_variance | 0.778955 |\n", "| learning_rate | 0.0003 |\n", "| loss | 13.9 |\n", "| n_updates | 3096 |\n", "| policy_gradient_loss | -0.00634 |\n", "| value_loss | 82.9 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 776 |\n", "| time_elapsed | 1386 |\n", "| total_timesteps | 794624 |\n", "| train/ | |\n", "| approx_kl | 0.014876015 |\n", "| clip_fraction | 0.135 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.74 |\n", "| explained_variance | 0.9827518 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.09 |\n", "| n_updates | 3100 |\n", "| policy_gradient_loss | -0.00145 |\n", "| value_loss | 5.4 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 192 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 777 |\n", "| time_elapsed | 1388 |\n", "| total_timesteps | 795648 |\n", "| train/ | |\n", "| approx_kl | 0.0055106683 |\n", "| clip_fraction | 0.0605 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.735 |\n", "| explained_variance | 0.3772092 |\n", "| learning_rate | 0.0003 |\n", "| loss | 447 |\n", "| n_updates | 3104 |\n", "| policy_gradient_loss | -0.00236 |\n", "| value_loss | 1.06e+03 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 193 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 778 |\n", "| time_elapsed | 1390 |\n", "| total_timesteps | 796672 |\n", "| train/ | |\n", "| approx_kl | 0.00040896563 |\n", "| clip_fraction | 0.000732 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.778 |\n", "| explained_variance | 0.58248556 |\n", "| learning_rate | 0.0003 |\n", "| loss | 106 |\n", "| n_updates | 3108 |\n", "| policy_gradient_loss | -0.00211 |\n", "| value_loss | 410 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 462 |\n", "| ep_rew_mean | 193 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 779 |\n", "| time_elapsed | 1392 |\n", "| total_timesteps | 797696 |\n", "| train/ | |\n", "| approx_kl | 0.0013226686 |\n", "| clip_fraction | 0.00879 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.585 |\n", "| explained_variance | 0.8369969 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.11 |\n", "| n_updates | 3112 |\n", "| policy_gradient_loss | -0.00274 |\n", "| value_loss | 25.6 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 459 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 780 |\n", "| time_elapsed | 1393 |\n", "| total_timesteps | 798720 |\n", "| train/ | |\n", "| approx_kl | 0.007834792 |\n", "| clip_fraction | 0.0618 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.784 |\n", "| explained_variance | 0.9613589 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.79 |\n", "| n_updates | 3116 |\n", "| policy_gradient_loss | -0.00272 |\n", "| value_loss | 15.8 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 460 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 781 |\n", "| time_elapsed | 1395 |\n", "| total_timesteps | 799744 |\n", "| train/ | |\n", "| approx_kl | 0.0051701535 |\n", "| clip_fraction | 0.063 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.704 |\n", "| explained_variance | 0.97058314 |\n", "| learning_rate | 0.0003 |\n", "| loss | 8.68 |\n", "| n_updates | 3120 |\n", "| policy_gradient_loss | -0.00296 |\n", "| value_loss | 17.6 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 782 |\n", "| time_elapsed | 1397 |\n", "| total_timesteps | 800768 |\n", "| train/ | |\n", "| approx_kl | 0.0013496582 |\n", "| clip_fraction | 0.0112 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.842 |\n", "| explained_variance | 0.9269048 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.93 |\n", "| n_updates | 3124 |\n", "| policy_gradient_loss | -0.000805 |\n", "| value_loss | 13.9 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 459 |\n", "| ep_rew_mean | 193 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 783 |\n", "| time_elapsed | 1399 |\n", "| total_timesteps | 801792 |\n", "| train/ | |\n", "| approx_kl | 0.003748878 |\n", "| clip_fraction | 0.00928 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.844 |\n", "| explained_variance | 0.91236943 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.12 |\n", "| n_updates | 3128 |\n", "| policy_gradient_loss | 0.00058 |\n", "| value_loss | 15.9 |\n", "-----------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 196 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 784 |\n", "| time_elapsed | 1400 |\n", "| total_timesteps | 802816 |\n", "| train/ | |\n", "| approx_kl | 0.00627237 |\n", "| clip_fraction | 0.0359 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.751 |\n", "| explained_variance | 0.9670936 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.57 |\n", "| n_updates | 3132 |\n", "| policy_gradient_loss | 0.000793 |\n", "| value_loss | 8.46 |\n", "----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 197 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 785 |\n", "| time_elapsed | 1402 |\n", "| total_timesteps | 803840 |\n", "| train/ | |\n", "| approx_kl | 0.007687486 |\n", "| clip_fraction | 0.074 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.763 |\n", "| explained_variance | 0.97563607 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.22 |\n", "| n_updates | 3136 |\n", "| policy_gradient_loss | 0.0016 |\n", "| value_loss | 8.15 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 200 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 786 |\n", "| time_elapsed | 1404 |\n", "| total_timesteps | 804864 |\n", "| train/ | |\n", "| approx_kl | 0.0040891673 |\n", "| clip_fraction | 0.0115 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.835 |\n", "| explained_variance | 0.9112801 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.38 |\n", "| n_updates | 3140 |\n", "| policy_gradient_loss | -0.000636 |\n", "| value_loss | 12.2 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 464 |\n", "| ep_rew_mean | 204 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 787 |\n", "| time_elapsed | 1406 |\n", "| total_timesteps | 805888 |\n", "| train/ | |\n", "| approx_kl | 0.0011699456 |\n", "| clip_fraction | 0.00195 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.715 |\n", "| explained_variance | 0.9241893 |\n", "| learning_rate | 0.0003 |\n", "| loss | 10.2 |\n", "| n_updates | 3144 |\n", "| policy_gradient_loss | 0.000917 |\n", "| value_loss | 28.2 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 466 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 788 |\n", "| time_elapsed | 1408 |\n", "| total_timesteps | 806912 |\n", "| train/ | |\n", "| approx_kl | 0.0053148256 |\n", "| clip_fraction | 0.0383 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.76 |\n", "| explained_variance | 0.97953594 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.96 |\n", "| n_updates | 3148 |\n", "| policy_gradient_loss | -0.00479 |\n", "| value_loss | 8.98 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 466 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 789 |\n", "| time_elapsed | 1410 |\n", "| total_timesteps | 807936 |\n", "| train/ | |\n", "| approx_kl | 0.0035671087 |\n", "| clip_fraction | 0.0347 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.809 |\n", "| explained_variance | 0.96757674 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.49 |\n", "| n_updates | 3152 |\n", "| policy_gradient_loss | -0.00533 |\n", "| value_loss | 13.9 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 468 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 790 |\n", "| time_elapsed | 1411 |\n", "| total_timesteps | 808960 |\n", "| train/ | |\n", "| approx_kl | 0.006744018 |\n", "| clip_fraction | 0.0393 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.764 |\n", "| explained_variance | 0.965472 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.7 |\n", "| n_updates | 3156 |\n", "| policy_gradient_loss | -0.0049 |\n", "| value_loss | 22.6 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 791 |\n", "| time_elapsed | 1413 |\n", "| total_timesteps | 809984 |\n", "| train/ | |\n", "| approx_kl | 0.0050601778 |\n", "| clip_fraction | 0.0283 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.818 |\n", "| explained_variance | 0.91442895 |\n", "| learning_rate | 0.0003 |\n", "| loss | 17.3 |\n", "| n_updates | 3160 |\n", "| policy_gradient_loss | -0.00418 |\n", "| value_loss | 34.9 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 792 |\n", "| time_elapsed | 1415 |\n", "| total_timesteps | 811008 |\n", "| train/ | |\n", "| approx_kl | 0.0046395985 |\n", "| clip_fraction | 0.0232 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.805 |\n", "| explained_variance | 0.9707044 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.79 |\n", "| n_updates | 3164 |\n", "| policy_gradient_loss | -0.000748 |\n", "| value_loss | 8.79 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 459 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 793 |\n", "| time_elapsed | 1416 |\n", "| total_timesteps | 812032 |\n", "| train/ | |\n", "| approx_kl | 0.0032754834 |\n", "| clip_fraction | 0.0134 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.777 |\n", "| explained_variance | 0.95957685 |\n", "| learning_rate | 0.0003 |\n", "| loss | 13.8 |\n", "| n_updates | 3168 |\n", "| policy_gradient_loss | -0.00125 |\n", "| value_loss | 29.6 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 794 |\n", "| time_elapsed | 1418 |\n", "| total_timesteps | 813056 |\n", "| train/ | |\n", "| approx_kl | 0.0006216647 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.814 |\n", "| explained_variance | 0.515272 |\n", "| learning_rate | 0.0003 |\n", "| loss | 369 |\n", "| n_updates | 3172 |\n", "| policy_gradient_loss | 0.000301 |\n", "| value_loss | 942 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 211 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 795 |\n", "| time_elapsed | 1420 |\n", "| total_timesteps | 814080 |\n", "| train/ | |\n", "| approx_kl | 0.0034800367 |\n", "| clip_fraction | 0.0298 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.827 |\n", "| explained_variance | 0.9711719 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.01 |\n", "| n_updates | 3176 |\n", "| policy_gradient_loss | -0.00494 |\n", "| value_loss | 17.1 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 796 |\n", "| time_elapsed | 1422 |\n", "| total_timesteps | 815104 |\n", "| train/ | |\n", "| approx_kl | 0.0023466456 |\n", "| clip_fraction | 0.00928 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.696 |\n", "| explained_variance | 0.9553854 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.1 |\n", "| n_updates | 3180 |\n", "| policy_gradient_loss | -0.00178 |\n", "| value_loss | 24.4 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 455 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 797 |\n", "| time_elapsed | 1424 |\n", "| total_timesteps | 816128 |\n", "| train/ | |\n", "| approx_kl | 0.0012794463 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.72 |\n", "| explained_variance | 0.49472117 |\n", "| learning_rate | 0.0003 |\n", "| loss | 457 |\n", "| n_updates | 3184 |\n", "| policy_gradient_loss | 0.000147 |\n", "| value_loss | 1.18e+03 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 215 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 798 |\n", "| time_elapsed | 1425 |\n", "| total_timesteps | 817152 |\n", "| train/ | |\n", "| approx_kl | 0.005656508 |\n", "| clip_fraction | 0.0527 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.791 |\n", "| explained_variance | 0.96763396 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.64 |\n", "| n_updates | 3188 |\n", "| policy_gradient_loss | -0.00613 |\n", "| value_loss | 14.1 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 459 |\n", "| ep_rew_mean | 218 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 799 |\n", "| time_elapsed | 1427 |\n", "| total_timesteps | 818176 |\n", "| train/ | |\n", "| approx_kl | 0.005392296 |\n", "| clip_fraction | 0.0679 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.742 |\n", "| explained_variance | 0.95543116 |\n", "| learning_rate | 0.0003 |\n", "| loss | 8.53 |\n", "| n_updates | 3192 |\n", "| policy_gradient_loss | -0.00401 |\n", "| value_loss | 37.8 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 464 |\n", "| ep_rew_mean | 218 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 800 |\n", "| time_elapsed | 1429 |\n", "| total_timesteps | 819200 |\n", "| train/ | |\n", "| approx_kl | 0.0034478847 |\n", "| clip_fraction | 0.0439 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.781 |\n", "| explained_variance | 0.9666716 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.52 |\n", "| n_updates | 3196 |\n", "| policy_gradient_loss | -0.0019 |\n", "| value_loss | 25.4 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 219 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 801 |\n", "| time_elapsed | 1431 |\n", "| total_timesteps | 820224 |\n", "| train/ | |\n", "| approx_kl | 0.004370408 |\n", "| clip_fraction | 0.0254 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.645 |\n", "| explained_variance | 0.9447645 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.15 |\n", "| n_updates | 3200 |\n", "| policy_gradient_loss | -0.00158 |\n", "| value_loss | 16.2 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 468 |\n", "| ep_rew_mean | 219 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 802 |\n", "| time_elapsed | 1433 |\n", "| total_timesteps | 821248 |\n", "| train/ | |\n", "| approx_kl | 0.0008130599 |\n", "| clip_fraction | 0.00171 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.88 |\n", "| explained_variance | 0.5174211 |\n", "| learning_rate | 0.0003 |\n", "| loss | 208 |\n", "| n_updates | 3204 |\n", "| policy_gradient_loss | -0.00188 |\n", "| value_loss | 810 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 803 |\n", "| time_elapsed | 1435 |\n", "| total_timesteps | 822272 |\n", "| train/ | |\n", "| approx_kl | 0.004970277 |\n", "| clip_fraction | 0.0166 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.684 |\n", "| explained_variance | 0.9515542 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.6 |\n", "| n_updates | 3208 |\n", "| policy_gradient_loss | 1.59e-05 |\n", "| value_loss | 25.1 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 462 |\n", "| ep_rew_mean | 215 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 804 |\n", "| time_elapsed | 1436 |\n", "| total_timesteps | 823296 |\n", "| train/ | |\n", "| approx_kl | 0.00014796236 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.822 |\n", "| explained_variance | 0.52352965 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.11e+03 |\n", "| n_updates | 3212 |\n", "| policy_gradient_loss | 0.000105 |\n", "| value_loss | 1.83e+03 |\n", "-------------------------------------------\n", "--------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 462 |\n", "| ep_rew_mean | 216 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 805 |\n", "| time_elapsed | 1438 |\n", "| total_timesteps | 824320 |\n", "| train/ | |\n", "| approx_kl | 1.04295905e-05 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.79 |\n", "| explained_variance | 0.5113547 |\n", "| learning_rate | 0.0003 |\n", "| loss | 310 |\n", "| n_updates | 3216 |\n", "| policy_gradient_loss | -4.09e-05 |\n", "| value_loss | 620 |\n", "--------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 457 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 806 |\n", "| time_elapsed | 1440 |\n", "| total_timesteps | 825344 |\n", "| train/ | |\n", "| approx_kl | 0.0031212345 |\n", "| clip_fraction | 0.00781 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.685 |\n", "| explained_variance | 0.91437423 |\n", "| learning_rate | 0.0003 |\n", "| loss | 21.8 |\n", "| n_updates | 3220 |\n", "| policy_gradient_loss | -0.0025 |\n", "| value_loss | 64.4 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 463 |\n", "| ep_rew_mean | 211 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 807 |\n", "| time_elapsed | 1442 |\n", "| total_timesteps | 826368 |\n", "| train/ | |\n", "| approx_kl | 0.00029566005 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.862 |\n", "| explained_variance | 0.32723856 |\n", "| learning_rate | 0.0003 |\n", "| loss | 724 |\n", "| n_updates | 3224 |\n", "| policy_gradient_loss | -0.000621 |\n", "| value_loss | 1.65e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 464 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 808 |\n", "| time_elapsed | 1444 |\n", "| total_timesteps | 827392 |\n", "| train/ | |\n", "| approx_kl | 0.0090375235 |\n", "| clip_fraction | 0.107 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.706 |\n", "| explained_variance | 0.98061967 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.05 |\n", "| n_updates | 3228 |\n", "| policy_gradient_loss | -0.00509 |\n", "| value_loss | 7.86 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 572 |\n", "| iterations | 809 |\n", "| time_elapsed | 1445 |\n", "| total_timesteps | 828416 |\n", "| train/ | |\n", "| approx_kl | 0.005017871 |\n", "| clip_fraction | 0.0286 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.75 |\n", "| explained_variance | 0.9234112 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5 |\n", "| n_updates | 3232 |\n", "| policy_gradient_loss | -0.00133 |\n", "| value_loss | 23.3 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 810 |\n", "| time_elapsed | 1447 |\n", "| total_timesteps | 829440 |\n", "| train/ | |\n", "| approx_kl | 0.006119647 |\n", "| clip_fraction | 0.033 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.817 |\n", "| explained_variance | 0.9742842 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.98 |\n", "| n_updates | 3236 |\n", "| policy_gradient_loss | -0.00416 |\n", "| value_loss | 18.4 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 811 |\n", "| time_elapsed | 1449 |\n", "| total_timesteps | 830464 |\n", "| train/ | |\n", "| approx_kl | 0.0015127202 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.806 |\n", "| explained_variance | 0.44570506 |\n", "| learning_rate | 0.0003 |\n", "| loss | 75.6 |\n", "| n_updates | 3240 |\n", "| policy_gradient_loss | -0.00189 |\n", "| value_loss | 825 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 455 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 812 |\n", "| time_elapsed | 1450 |\n", "| total_timesteps | 831488 |\n", "| train/ | |\n", "| approx_kl | 0.00021065498 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.867 |\n", "| explained_variance | 0.45709783 |\n", "| learning_rate | 0.0003 |\n", "| loss | 329 |\n", "| n_updates | 3244 |\n", "| policy_gradient_loss | -0.000366 |\n", "| value_loss | 797 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 457 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 813 |\n", "| time_elapsed | 1452 |\n", "| total_timesteps | 832512 |\n", "| train/ | |\n", "| approx_kl | 0.0006038125 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.859 |\n", "| explained_variance | 0.5473994 |\n", "| learning_rate | 0.0003 |\n", "| loss | 279 |\n", "| n_updates | 3248 |\n", "| policy_gradient_loss | -0.00019 |\n", "| value_loss | 655 |\n", "------------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 453 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 814 |\n", "| time_elapsed | 1454 |\n", "| total_timesteps | 833536 |\n", "| train/ | |\n", "| approx_kl | 0.00443552 |\n", "| clip_fraction | 0.0159 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.683 |\n", "| explained_variance | 0.90832573 |\n", "| learning_rate | 0.0003 |\n", "| loss | 18 |\n", "| n_updates | 3252 |\n", "| policy_gradient_loss | -0.00144 |\n", "| value_loss | 41.8 |\n", "----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 815 |\n", "| time_elapsed | 1456 |\n", "| total_timesteps | 834560 |\n", "| train/ | |\n", "| approx_kl | 0.0035896853 |\n", "| clip_fraction | 0.0134 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.711 |\n", "| explained_variance | 0.8776821 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.1 |\n", "| n_updates | 3256 |\n", "| policy_gradient_loss | -0.00223 |\n", "| value_loss | 33.1 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 816 |\n", "| time_elapsed | 1458 |\n", "| total_timesteps | 835584 |\n", "| train/ | |\n", "| approx_kl | 0.000368813 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.873 |\n", "| explained_variance | 0.35390645 |\n", "| learning_rate | 0.0003 |\n", "| loss | 790 |\n", "| n_updates | 3260 |\n", "| policy_gradient_loss | -0.000215 |\n", "| value_loss | 1.57e+03 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 448 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 817 |\n", "| time_elapsed | 1459 |\n", "| total_timesteps | 836608 |\n", "| train/ | |\n", "| approx_kl | 0.00031387404 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.791 |\n", "| explained_variance | 0.4154219 |\n", "| learning_rate | 0.0003 |\n", "| loss | 382 |\n", "| n_updates | 3264 |\n", "| policy_gradient_loss | -0.000216 |\n", "| value_loss | 674 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 451 |\n", "| ep_rew_mean | 203 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 818 |\n", "| time_elapsed | 1461 |\n", "| total_timesteps | 837632 |\n", "| train/ | |\n", "| approx_kl | 0.006108832 |\n", "| clip_fraction | 0.0281 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.836 |\n", "| explained_variance | 0.6196294 |\n", "| learning_rate | 0.0003 |\n", "| loss | 33.3 |\n", "| n_updates | 3268 |\n", "| policy_gradient_loss | -0.00266 |\n", "| value_loss | 76.6 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 445 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 819 |\n", "| time_elapsed | 1463 |\n", "| total_timesteps | 838656 |\n", "| train/ | |\n", "| approx_kl | 0.00015586335 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.815 |\n", "| explained_variance | 0.59229076 |\n", "| learning_rate | 0.0003 |\n", "| loss | 152 |\n", "| n_updates | 3272 |\n", "| policy_gradient_loss | -0.00025 |\n", "| value_loss | 618 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 449 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 820 |\n", "| time_elapsed | 1464 |\n", "| total_timesteps | 839680 |\n", "| train/ | |\n", "| approx_kl | 0.002189963 |\n", "| clip_fraction | 0.00537 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.774 |\n", "| explained_variance | 0.8516287 |\n", "| learning_rate | 0.0003 |\n", "| loss | 31.9 |\n", "| n_updates | 3276 |\n", "| policy_gradient_loss | -0.00149 |\n", "| value_loss | 107 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 451 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 821 |\n", "| time_elapsed | 1466 |\n", "| total_timesteps | 840704 |\n", "| train/ | |\n", "| approx_kl | 0.0043054977 |\n", "| clip_fraction | 0.0164 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.794 |\n", "| explained_variance | 0.7804343 |\n", "| learning_rate | 0.0003 |\n", "| loss | 25.2 |\n", "| n_updates | 3280 |\n", "| policy_gradient_loss | -0.0014 |\n", "| value_loss | 74.4 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 444 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 822 |\n", "| time_elapsed | 1468 |\n", "| total_timesteps | 841728 |\n", "| train/ | |\n", "| approx_kl | 0.002112137 |\n", "| clip_fraction | 0.00513 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.797 |\n", "| explained_variance | 0.9039548 |\n", "| learning_rate | 0.0003 |\n", "| loss | 8.85 |\n", "| n_updates | 3284 |\n", "| policy_gradient_loss | -0.000834 |\n", "| value_loss | 35 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 823 |\n", "| time_elapsed | 1470 |\n", "| total_timesteps | 842752 |\n", "| train/ | |\n", "| approx_kl | 0.0010862828 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.856 |\n", "| explained_variance | 0.51115274 |\n", "| learning_rate | 0.0003 |\n", "| loss | 636 |\n", "| n_updates | 3288 |\n", "| policy_gradient_loss | -0.000843 |\n", "| value_loss | 905 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 449 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 824 |\n", "| time_elapsed | 1472 |\n", "| total_timesteps | 843776 |\n", "| train/ | |\n", "| approx_kl | 0.007972829 |\n", "| clip_fraction | 0.0469 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.573 |\n", "| explained_variance | 0.86519 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.31 |\n", "| n_updates | 3292 |\n", "| policy_gradient_loss | -0.00348 |\n", "| value_loss | 15.8 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 825 |\n", "| time_elapsed | 1473 |\n", "| total_timesteps | 844800 |\n", "| train/ | |\n", "| approx_kl | 0.0030525909 |\n", "| clip_fraction | 0.0413 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.8 |\n", "| explained_variance | 0.92672074 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.69 |\n", "| n_updates | 3296 |\n", "| policy_gradient_loss | -0.00237 |\n", "| value_loss | 15.3 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 826 |\n", "| time_elapsed | 1475 |\n", "| total_timesteps | 845824 |\n", "| train/ | |\n", "| approx_kl | 0.002864468 |\n", "| clip_fraction | 0.0447 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.816 |\n", "| explained_variance | 0.9123099 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.33 |\n", "| n_updates | 3300 |\n", "| policy_gradient_loss | -0.00193 |\n", "| value_loss | 22 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 827 |\n", "| time_elapsed | 1477 |\n", "| total_timesteps | 846848 |\n", "| train/ | |\n", "| approx_kl | 0.003244643 |\n", "| clip_fraction | 0.0247 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.842 |\n", "| explained_variance | 0.942331 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.02 |\n", "| n_updates | 3304 |\n", "| policy_gradient_loss | -0.00347 |\n", "| value_loss | 18 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 828 |\n", "| time_elapsed | 1479 |\n", "| total_timesteps | 847872 |\n", "| train/ | |\n", "| approx_kl | 0.0029303688 |\n", "| clip_fraction | 0.0281 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.736 |\n", "| explained_variance | 0.8256559 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.43 |\n", "| n_updates | 3308 |\n", "| policy_gradient_loss | -0.00123 |\n", "| value_loss | 34.3 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 451 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 829 |\n", "| time_elapsed | 1481 |\n", "| total_timesteps | 848896 |\n", "| train/ | |\n", "| approx_kl | 0.009592405 |\n", "| clip_fraction | 0.0623 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.836 |\n", "| explained_variance | 0.96280015 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.42 |\n", "| n_updates | 3312 |\n", "| policy_gradient_loss | -0.00363 |\n", "| value_loss | 7.89 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 449 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 830 |\n", "| time_elapsed | 1482 |\n", "| total_timesteps | 849920 |\n", "| train/ | |\n", "| approx_kl | 0.0056061675 |\n", "| clip_fraction | 0.0586 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.846 |\n", "| explained_variance | 0.94896996 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.53 |\n", "| n_updates | 3316 |\n", "| policy_gradient_loss | -0.00219 |\n", "| value_loss | 12.1 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 450 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 831 |\n", "| time_elapsed | 1484 |\n", "| total_timesteps | 850944 |\n", "| train/ | |\n", "| approx_kl | 0.0034652464 |\n", "| clip_fraction | 0.0115 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.706 |\n", "| explained_variance | 0.9485093 |\n", "| learning_rate | 0.0003 |\n", "| loss | 8.57 |\n", "| n_updates | 3320 |\n", "| policy_gradient_loss | -0.000113 |\n", "| value_loss | 19.1 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 455 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 832 |\n", "| time_elapsed | 1486 |\n", "| total_timesteps | 851968 |\n", "| train/ | |\n", "| approx_kl | 0.011424896 |\n", "| clip_fraction | 0.0845 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.764 |\n", "| explained_variance | 0.9810066 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.92 |\n", "| n_updates | 3324 |\n", "| policy_gradient_loss | -0.00488 |\n", "| value_loss | 5.6 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 456 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 833 |\n", "| time_elapsed | 1487 |\n", "| total_timesteps | 852992 |\n", "| train/ | |\n", "| approx_kl | 0.0027892482 |\n", "| clip_fraction | 0.0649 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.751 |\n", "| explained_variance | 0.96821916 |\n", "| learning_rate | 0.0003 |\n", "| loss | 18.4 |\n", "| n_updates | 3328 |\n", "| policy_gradient_loss | 0.00387 |\n", "| value_loss | 32.5 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 457 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 834 |\n", "| time_elapsed | 1489 |\n", "| total_timesteps | 854016 |\n", "| train/ | |\n", "| approx_kl | 0.0044964897 |\n", "| clip_fraction | 0.0186 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.792 |\n", "| explained_variance | 0.9708647 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.04 |\n", "| n_updates | 3332 |\n", "| policy_gradient_loss | -0.000834 |\n", "| value_loss | 15.9 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 204 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 835 |\n", "| time_elapsed | 1491 |\n", "| total_timesteps | 855040 |\n", "| train/ | |\n", "| approx_kl | 0.007305797 |\n", "| clip_fraction | 0.0457 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.78 |\n", "| explained_variance | 0.9834209 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.95 |\n", "| n_updates | 3336 |\n", "| policy_gradient_loss | -0.00584 |\n", "| value_loss | 6.97 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 460 |\n", "| ep_rew_mean | 204 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 836 |\n", "| time_elapsed | 1493 |\n", "| total_timesteps | 856064 |\n", "| train/ | |\n", "| approx_kl | 0.006209428 |\n", "| clip_fraction | 0.0667 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.804 |\n", "| explained_variance | 0.9793832 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.3 |\n", "| n_updates | 3340 |\n", "| policy_gradient_loss | -0.00356 |\n", "| value_loss | 8.38 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 204 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 837 |\n", "| time_elapsed | 1495 |\n", "| total_timesteps | 857088 |\n", "| train/ | |\n", "| approx_kl | 0.0040859734 |\n", "| clip_fraction | 0.0286 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.707 |\n", "| explained_variance | 0.9716868 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.95 |\n", "| n_updates | 3344 |\n", "| policy_gradient_loss | -0.00152 |\n", "| value_loss | 12.3 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 464 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 838 |\n", "| time_elapsed | 1496 |\n", "| total_timesteps | 858112 |\n", "| train/ | |\n", "| approx_kl | 0.0032926532 |\n", "| clip_fraction | 0.03 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.778 |\n", "| explained_variance | 0.9825648 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.85 |\n", "| n_updates | 3348 |\n", "| policy_gradient_loss | -0.00254 |\n", "| value_loss | 9.3 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 839 |\n", "| time_elapsed | 1498 |\n", "| total_timesteps | 859136 |\n", "| train/ | |\n", "| approx_kl | 0.0033243245 |\n", "| clip_fraction | 0.0205 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.747 |\n", "| explained_variance | 0.96907705 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.8 |\n", "| n_updates | 3352 |\n", "| policy_gradient_loss | -0.00297 |\n", "| value_loss | 21 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 840 |\n", "| time_elapsed | 1500 |\n", "| total_timesteps | 860160 |\n", "| train/ | |\n", "| approx_kl | 0.0043827207 |\n", "| clip_fraction | 0.0168 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.825 |\n", "| explained_variance | 0.9849644 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.97 |\n", "| n_updates | 3356 |\n", "| policy_gradient_loss | -0.000236 |\n", "| value_loss | 6.36 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 841 |\n", "| time_elapsed | 1502 |\n", "| total_timesteps | 861184 |\n", "| train/ | |\n", "| approx_kl | 0.0017283438 |\n", "| clip_fraction | 0.0151 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.746 |\n", "| explained_variance | 0.98362017 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.82 |\n", "| n_updates | 3360 |\n", "| policy_gradient_loss | -0.00135 |\n", "| value_loss | 11.3 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 842 |\n", "| time_elapsed | 1504 |\n", "| total_timesteps | 862208 |\n", "| train/ | |\n", "| approx_kl | 0.0039550196 |\n", "| clip_fraction | 0.0327 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.738 |\n", "| explained_variance | 0.98281026 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.04 |\n", "| n_updates | 3364 |\n", "| policy_gradient_loss | -0.00314 |\n", "| value_loss | 9.43 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 466 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 843 |\n", "| time_elapsed | 1505 |\n", "| total_timesteps | 863232 |\n", "| train/ | |\n", "| approx_kl | 0.0044392804 |\n", "| clip_fraction | 0.0239 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.773 |\n", "| explained_variance | 0.9898201 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.54 |\n", "| n_updates | 3368 |\n", "| policy_gradient_loss | -0.00191 |\n", "| value_loss | 4.4 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 844 |\n", "| time_elapsed | 1507 |\n", "| total_timesteps | 864256 |\n", "| train/ | |\n", "| approx_kl | 0.0073433556 |\n", "| clip_fraction | 0.0857 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.753 |\n", "| explained_variance | 0.98584706 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.5 |\n", "| n_updates | 3372 |\n", "| policy_gradient_loss | -0.00455 |\n", "| value_loss | 8.66 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 464 |\n", "| ep_rew_mean | 205 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 845 |\n", "| time_elapsed | 1509 |\n", "| total_timesteps | 865280 |\n", "| train/ | |\n", "| approx_kl | 0.0054736813 |\n", "| clip_fraction | 0.0632 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.839 |\n", "| explained_variance | 0.47511017 |\n", "| learning_rate | 0.0003 |\n", "| loss | 488 |\n", "| n_updates | 3376 |\n", "| policy_gradient_loss | 0.00289 |\n", "| value_loss | 923 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 203 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 846 |\n", "| time_elapsed | 1511 |\n", "| total_timesteps | 866304 |\n", "| train/ | |\n", "| approx_kl | 0.0024986085 |\n", "| clip_fraction | 0.00806 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.616 |\n", "| explained_variance | 0.9536722 |\n", "| learning_rate | 0.0003 |\n", "| loss | 8.74 |\n", "| n_updates | 3380 |\n", "| policy_gradient_loss | -0.00419 |\n", "| value_loss | 25.6 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 473 |\n", "| ep_rew_mean | 202 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 847 |\n", "| time_elapsed | 1513 |\n", "| total_timesteps | 867328 |\n", "| train/ | |\n", "| approx_kl | 0.0009563471 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.808 |\n", "| explained_variance | 0.5712812 |\n", "| learning_rate | 0.0003 |\n", "| loss | 310 |\n", "| n_updates | 3384 |\n", "| policy_gradient_loss | -0.00211 |\n", "| value_loss | 909 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 204 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 848 |\n", "| time_elapsed | 1515 |\n", "| total_timesteps | 868352 |\n", "| train/ | |\n", "| approx_kl | 0.010084745 |\n", "| clip_fraction | 0.0293 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.662 |\n", "| explained_variance | 0.98822254 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.06 |\n", "| n_updates | 3388 |\n", "| policy_gradient_loss | -0.00141 |\n", "| value_loss | 6.36 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 467 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 849 |\n", "| time_elapsed | 1516 |\n", "| total_timesteps | 869376 |\n", "| train/ | |\n", "| approx_kl | 0.0071091414 |\n", "| clip_fraction | 0.0286 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.743 |\n", "| explained_variance | 0.9325491 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.78 |\n", "| n_updates | 3392 |\n", "| policy_gradient_loss | 2.42e-05 |\n", "| value_loss | 18.9 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 470 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 850 |\n", "| time_elapsed | 1518 |\n", "| total_timesteps | 870400 |\n", "| train/ | |\n", "| approx_kl | 0.004442379 |\n", "| clip_fraction | 0.0276 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.717 |\n", "| explained_variance | 0.97349274 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.69 |\n", "| n_updates | 3396 |\n", "| policy_gradient_loss | -0.00271 |\n", "| value_loss | 20.2 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 469 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 851 |\n", "| time_elapsed | 1520 |\n", "| total_timesteps | 871424 |\n", "| train/ | |\n", "| approx_kl | 0.0057218047 |\n", "| clip_fraction | 0.0181 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.75 |\n", "| explained_variance | 0.97339994 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.42 |\n", "| n_updates | 3400 |\n", "| policy_gradient_loss | -0.00232 |\n", "| value_loss | 12.8 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 471 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 852 |\n", "| time_elapsed | 1521 |\n", "| total_timesteps | 872448 |\n", "| train/ | |\n", "| approx_kl | 0.0043360097 |\n", "| clip_fraction | 0.0427 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.833 |\n", "| explained_variance | 0.9459022 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.1 |\n", "| n_updates | 3404 |\n", "| policy_gradient_loss | -0.00195 |\n", "| value_loss | 12.4 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 215 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 853 |\n", "| time_elapsed | 1523 |\n", "| total_timesteps | 873472 |\n", "| train/ | |\n", "| approx_kl | 0.0038297684 |\n", "| clip_fraction | 0.019 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.687 |\n", "| explained_variance | 0.97493154 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.55 |\n", "| n_updates | 3408 |\n", "| policy_gradient_loss | -0.00278 |\n", "| value_loss | 14.8 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 218 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 854 |\n", "| time_elapsed | 1525 |\n", "| total_timesteps | 874496 |\n", "| train/ | |\n", "| approx_kl | 0.0027273647 |\n", "| clip_fraction | 0.00977 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.783 |\n", "| explained_variance | 0.9552442 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.24 |\n", "| n_updates | 3412 |\n", "| policy_gradient_loss | -0.00115 |\n", "| value_loss | 25.8 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 457 |\n", "| ep_rew_mean | 218 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 855 |\n", "| time_elapsed | 1527 |\n", "| total_timesteps | 875520 |\n", "| train/ | |\n", "| approx_kl | 0.0017827622 |\n", "| clip_fraction | 0.00732 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.726 |\n", "| explained_variance | 0.9755817 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.29 |\n", "| n_updates | 3416 |\n", "| policy_gradient_loss | -0.000711 |\n", "| value_loss | 16.5 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 458 |\n", "| ep_rew_mean | 220 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 856 |\n", "| time_elapsed | 1529 |\n", "| total_timesteps | 876544 |\n", "| train/ | |\n", "| approx_kl | 0.0013855502 |\n", "| clip_fraction | 0.00342 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.721 |\n", "| explained_variance | 0.41485804 |\n", "| learning_rate | 0.0003 |\n", "| loss | 624 |\n", "| n_updates | 3420 |\n", "| policy_gradient_loss | -0.000695 |\n", "| value_loss | 1.01e+03 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 465 |\n", "| ep_rew_mean | 222 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 857 |\n", "| time_elapsed | 1530 |\n", "| total_timesteps | 877568 |\n", "| train/ | |\n", "| approx_kl | 0.001300647 |\n", "| clip_fraction | 0.0022 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.751 |\n", "| explained_variance | 0.9576344 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.6 |\n", "| n_updates | 3424 |\n", "| policy_gradient_loss | -0.00134 |\n", "| value_loss | 39.8 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 463 |\n", "| ep_rew_mean | 221 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 858 |\n", "| time_elapsed | 1532 |\n", "| total_timesteps | 878592 |\n", "| train/ | |\n", "| approx_kl | 0.0045768805 |\n", "| clip_fraction | 0.0332 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.726 |\n", "| explained_variance | 0.9945018 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.37 |\n", "| n_updates | 3428 |\n", "| policy_gradient_loss | -0.00118 |\n", "| value_loss | 4.17 |\n", "------------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 461 |\n", "| ep_rew_mean | 219 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 859 |\n", "| time_elapsed | 1534 |\n", "| total_timesteps | 879616 |\n", "| train/ | |\n", "| approx_kl | 0.00398943 |\n", "| clip_fraction | 0.0444 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.697 |\n", "| explained_variance | 0.98970187 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.57 |\n", "| n_updates | 3432 |\n", "| policy_gradient_loss | -0.00172 |\n", "| value_loss | 5.6 |\n", "----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 459 |\n", "| ep_rew_mean | 221 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 860 |\n", "| time_elapsed | 1535 |\n", "| total_timesteps | 880640 |\n", "| train/ | |\n", "| approx_kl | 0.001723927 |\n", "| clip_fraction | 0.0061 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.836 |\n", "| explained_variance | 0.4143275 |\n", "| learning_rate | 0.0003 |\n", "| loss | 251 |\n", "| n_updates | 3436 |\n", "| policy_gradient_loss | -0.000468 |\n", "| value_loss | 1.01e+03 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 459 |\n", "| ep_rew_mean | 224 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 861 |\n", "| time_elapsed | 1537 |\n", "| total_timesteps | 881664 |\n", "| train/ | |\n", "| approx_kl | 0.00011460652 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.764 |\n", "| explained_variance | 0.51780725 |\n", "| learning_rate | 0.0003 |\n", "| loss | 584 |\n", "| n_updates | 3440 |\n", "| policy_gradient_loss | -0.000212 |\n", "| value_loss | 862 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 457 |\n", "| ep_rew_mean | 224 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 862 |\n", "| time_elapsed | 1539 |\n", "| total_timesteps | 882688 |\n", "| train/ | |\n", "| approx_kl | 0.005809918 |\n", "| clip_fraction | 0.0515 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.791 |\n", "| explained_variance | 0.98725134 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.08 |\n", "| n_updates | 3444 |\n", "| policy_gradient_loss | -0.00304 |\n", "| value_loss | 7.11 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 455 |\n", "| ep_rew_mean | 223 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 863 |\n", "| time_elapsed | 1541 |\n", "| total_timesteps | 883712 |\n", "| train/ | |\n", "| approx_kl | 0.007936319 |\n", "| clip_fraction | 0.0781 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.751 |\n", "| explained_variance | 0.9762511 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.97 |\n", "| n_updates | 3448 |\n", "| policy_gradient_loss | -0.00455 |\n", "| value_loss | 8.9 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 455 |\n", "| ep_rew_mean | 223 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 864 |\n", "| time_elapsed | 1543 |\n", "| total_timesteps | 884736 |\n", "| train/ | |\n", "| approx_kl | 0.006779057 |\n", "| clip_fraction | 0.083 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.76 |\n", "| explained_variance | 0.43166476 |\n", "| learning_rate | 0.0003 |\n", "| loss | 850 |\n", "| n_updates | 3452 |\n", "| policy_gradient_loss | -0.00039 |\n", "| value_loss | 926 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 452 |\n", "| ep_rew_mean | 223 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 865 |\n", "| time_elapsed | 1544 |\n", "| total_timesteps | 885760 |\n", "| train/ | |\n", "| approx_kl | 0.007929431 |\n", "| clip_fraction | 0.0603 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.796 |\n", "| explained_variance | 0.97070503 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.17 |\n", "| n_updates | 3456 |\n", "| policy_gradient_loss | -0.00372 |\n", "| value_loss | 15.2 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 452 |\n", "| ep_rew_mean | 226 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 866 |\n", "| time_elapsed | 1546 |\n", "| total_timesteps | 886784 |\n", "| train/ | |\n", "| approx_kl | 0.0017856082 |\n", "| clip_fraction | 0.00464 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.638 |\n", "| explained_variance | 0.9492958 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.1 |\n", "| n_updates | 3460 |\n", "| policy_gradient_loss | -0.000968 |\n", "| value_loss | 26.8 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 445 |\n", "| ep_rew_mean | 228 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 867 |\n", "| time_elapsed | 1548 |\n", "| total_timesteps | 887808 |\n", "| train/ | |\n", "| approx_kl | 0.003587621 |\n", "| clip_fraction | 0.0405 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.784 |\n", "| explained_variance | 0.9623703 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.41 |\n", "| n_updates | 3464 |\n", "| policy_gradient_loss | -0.00411 |\n", "| value_loss | 18.5 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 441 |\n", "| ep_rew_mean | 225 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 868 |\n", "| time_elapsed | 1550 |\n", "| total_timesteps | 888832 |\n", "| train/ | |\n", "| approx_kl | 0.0029214344 |\n", "| clip_fraction | 0.00781 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.74 |\n", "| explained_variance | 0.93390846 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.72 |\n", "| n_updates | 3468 |\n", "| policy_gradient_loss | -0.003 |\n", "| value_loss | 25.8 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 441 |\n", "| ep_rew_mean | 223 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 869 |\n", "| time_elapsed | 1552 |\n", "| total_timesteps | 889856 |\n", "| train/ | |\n", "| approx_kl | 0.0029549468 |\n", "| clip_fraction | 0.0146 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.748 |\n", "| explained_variance | 0.55921006 |\n", "| learning_rate | 0.0003 |\n", "| loss | 93.5 |\n", "| n_updates | 3472 |\n", "| policy_gradient_loss | 0.00125 |\n", "| value_loss | 781 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 446 |\n", "| ep_rew_mean | 221 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 870 |\n", "| time_elapsed | 1553 |\n", "| total_timesteps | 890880 |\n", "| train/ | |\n", "| approx_kl | 6.223383e-05 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.639 |\n", "| explained_variance | 0.5726714 |\n", "| learning_rate | 0.0003 |\n", "| loss | 307 |\n", "| n_updates | 3476 |\n", "| policy_gradient_loss | -5.83e-05 |\n", "| value_loss | 763 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 444 |\n", "| ep_rew_mean | 221 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 871 |\n", "| time_elapsed | 1555 |\n", "| total_timesteps | 891904 |\n", "| train/ | |\n", "| approx_kl | 0.008895343 |\n", "| clip_fraction | 0.0908 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.711 |\n", "| explained_variance | 0.97896516 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.55 |\n", "| n_updates | 3480 |\n", "| policy_gradient_loss | -0.00568 |\n", "| value_loss | 11.5 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 447 |\n", "| ep_rew_mean | 222 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 872 |\n", "| time_elapsed | 1557 |\n", "| total_timesteps | 892928 |\n", "| train/ | |\n", "| approx_kl | 0.006091318 |\n", "| clip_fraction | 0.0781 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.779 |\n", "| explained_variance | 0.9273951 |\n", "| learning_rate | 0.0003 |\n", "| loss | 26.6 |\n", "| n_updates | 3484 |\n", "| policy_gradient_loss | -0.00463 |\n", "| value_loss | 41.3 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 446 |\n", "| ep_rew_mean | 222 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 873 |\n", "| time_elapsed | 1558 |\n", "| total_timesteps | 893952 |\n", "| train/ | |\n", "| approx_kl | 0.003748555 |\n", "| clip_fraction | 0.0186 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.638 |\n", "| explained_variance | 0.9726877 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.54 |\n", "| n_updates | 3488 |\n", "| policy_gradient_loss | 0.00139 |\n", "| value_loss | 15.2 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 444 |\n", "| ep_rew_mean | 222 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 874 |\n", "| time_elapsed | 1560 |\n", "| total_timesteps | 894976 |\n", "| train/ | |\n", "| approx_kl | 0.012988065 |\n", "| clip_fraction | 0.0715 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.794 |\n", "| explained_variance | 0.95748454 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.43 |\n", "| n_updates | 3492 |\n", "| policy_gradient_loss | -0.00402 |\n", "| value_loss | 17.3 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 435 |\n", "| ep_rew_mean | 223 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 875 |\n", "| time_elapsed | 1562 |\n", "| total_timesteps | 896000 |\n", "| train/ | |\n", "| approx_kl | 0.0023541641 |\n", "| clip_fraction | 0.00513 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.726 |\n", "| explained_variance | 0.97648793 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.32 |\n", "| n_updates | 3496 |\n", "| policy_gradient_loss | -0.00377 |\n", "| value_loss | 13.3 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 431 |\n", "| ep_rew_mean | 221 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 876 |\n", "| time_elapsed | 1564 |\n", "| total_timesteps | 897024 |\n", "| train/ | |\n", "| approx_kl | 0.0045425966 |\n", "| clip_fraction | 0.0437 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.76 |\n", "| explained_variance | 0.9737478 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.11 |\n", "| n_updates | 3500 |\n", "| policy_gradient_loss | -0.00181 |\n", "| value_loss | 14.8 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 426 |\n", "| ep_rew_mean | 221 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 877 |\n", "| time_elapsed | 1566 |\n", "| total_timesteps | 898048 |\n", "| train/ | |\n", "| approx_kl | 0.0012864543 |\n", "| clip_fraction | 0.000732 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.828 |\n", "| explained_variance | 0.41175282 |\n", "| learning_rate | 0.0003 |\n", "| loss | 556 |\n", "| n_updates | 3504 |\n", "| policy_gradient_loss | -2.21e-05 |\n", "| value_loss | 929 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 431 |\n", "| ep_rew_mean | 220 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 878 |\n", "| time_elapsed | 1567 |\n", "| total_timesteps | 899072 |\n", "| train/ | |\n", "| approx_kl | 0.0017538816 |\n", "| clip_fraction | 0.00293 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.764 |\n", "| explained_variance | 0.9179718 |\n", "| learning_rate | 0.0003 |\n", "| loss | 10.2 |\n", "| n_updates | 3508 |\n", "| policy_gradient_loss | -0.000635 |\n", "| value_loss | 35.7 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 430 |\n", "| ep_rew_mean | 220 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 879 |\n", "| time_elapsed | 1569 |\n", "| total_timesteps | 900096 |\n", "| train/ | |\n", "| approx_kl | 0.007984748 |\n", "| clip_fraction | 0.0442 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.692 |\n", "| explained_variance | 0.98170435 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.15 |\n", "| n_updates | 3512 |\n", "| policy_gradient_loss | -0.00289 |\n", "| value_loss | 15.9 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 426 |\n", "| ep_rew_mean | 217 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 880 |\n", "| time_elapsed | 1571 |\n", "| total_timesteps | 901120 |\n", "| train/ | |\n", "| approx_kl | 0.004323054 |\n", "| clip_fraction | 0.0266 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.679 |\n", "| explained_variance | 0.96854734 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.2 |\n", "| n_updates | 3516 |\n", "| policy_gradient_loss | -0.00429 |\n", "| value_loss | 24.1 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 423 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 881 |\n", "| time_elapsed | 1572 |\n", "| total_timesteps | 902144 |\n", "| train/ | |\n", "| approx_kl | 9.32517e-05 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.753 |\n", "| explained_variance | 0.44401038 |\n", "| learning_rate | 0.0003 |\n", "| loss | 120 |\n", "| n_updates | 3520 |\n", "| policy_gradient_loss | 0.000465 |\n", "| value_loss | 952 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 422 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 882 |\n", "| time_elapsed | 1574 |\n", "| total_timesteps | 903168 |\n", "| train/ | |\n", "| approx_kl | 0.00011415267 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.804 |\n", "| explained_variance | 0.6974262 |\n", "| learning_rate | 0.0003 |\n", "| loss | 600 |\n", "| n_updates | 3524 |\n", "| policy_gradient_loss | -0.000406 |\n", "| value_loss | 1.33e+03 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 420 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 883 |\n", "| time_elapsed | 1576 |\n", "| total_timesteps | 904192 |\n", "| train/ | |\n", "| approx_kl | 0.00019792694 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.683 |\n", "| explained_variance | 0.75329125 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.8 |\n", "| n_updates | 3528 |\n", "| policy_gradient_loss | -0.00037 |\n", "| value_loss | 162 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 418 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 884 |\n", "| time_elapsed | 1578 |\n", "| total_timesteps | 905216 |\n", "| train/ | |\n", "| approx_kl | 0.00035233446 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.712 |\n", "| explained_variance | 0.8552117 |\n", "| learning_rate | 0.0003 |\n", "| loss | 23.6 |\n", "| n_updates | 3532 |\n", "| policy_gradient_loss | -0.000142 |\n", "| value_loss | 82.1 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 421 |\n", "| ep_rew_mean | 215 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 885 |\n", "| time_elapsed | 1580 |\n", "| total_timesteps | 906240 |\n", "| train/ | |\n", "| approx_kl | 0.0053853677 |\n", "| clip_fraction | 0.0566 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.755 |\n", "| explained_variance | 0.8885267 |\n", "| learning_rate | 0.0003 |\n", "| loss | 14.5 |\n", "| n_updates | 3536 |\n", "| policy_gradient_loss | -0.00702 |\n", "| value_loss | 35.2 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 416 |\n", "| ep_rew_mean | 217 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 886 |\n", "| time_elapsed | 1581 |\n", "| total_timesteps | 907264 |\n", "| train/ | |\n", "| approx_kl | 0.0049076686 |\n", "| clip_fraction | 0.0474 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.677 |\n", "| explained_variance | 0.92746615 |\n", "| learning_rate | 0.0003 |\n", "| loss | 10.3 |\n", "| n_updates | 3540 |\n", "| policy_gradient_loss | -0.00393 |\n", "| value_loss | 21.1 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 423 |\n", "| ep_rew_mean | 218 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 887 |\n", "| time_elapsed | 1583 |\n", "| total_timesteps | 908288 |\n", "| train/ | |\n", "| approx_kl | 0.0025728666 |\n", "| clip_fraction | 0.00757 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.675 |\n", "| explained_variance | 0.96330124 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.42 |\n", "| n_updates | 3544 |\n", "| policy_gradient_loss | -0.00137 |\n", "| value_loss | 22.2 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 415 |\n", "| ep_rew_mean | 216 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 888 |\n", "| time_elapsed | 1585 |\n", "| total_timesteps | 909312 |\n", "| train/ | |\n", "| approx_kl | 0.025034787 |\n", "| clip_fraction | 0.0615 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.706 |\n", "| explained_variance | 0.9752804 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.49 |\n", "| n_updates | 3548 |\n", "| policy_gradient_loss | -0.000454 |\n", "| value_loss | 7.04 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 408 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 889 |\n", "| time_elapsed | 1587 |\n", "| total_timesteps | 910336 |\n", "| train/ | |\n", "| approx_kl | 0.017769814 |\n", "| clip_fraction | 0.256 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.846 |\n", "| explained_variance | 0.48640817 |\n", "| learning_rate | 0.0003 |\n", "| loss | 224 |\n", "| n_updates | 3552 |\n", "| policy_gradient_loss | 0.00955 |\n", "| value_loss | 888 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 409 |\n", "| ep_rew_mean | 211 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 890 |\n", "| time_elapsed | 1588 |\n", "| total_timesteps | 911360 |\n", "| train/ | |\n", "| approx_kl | 0.00019348948 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.78 |\n", "| explained_variance | 0.51285857 |\n", "| learning_rate | 0.0003 |\n", "| loss | 967 |\n", "| n_updates | 3556 |\n", "| policy_gradient_loss | 8.37e-05 |\n", "| value_loss | 2.15e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 407 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 891 |\n", "| time_elapsed | 1590 |\n", "| total_timesteps | 912384 |\n", "| train/ | |\n", "| approx_kl | 0.0018703187 |\n", "| clip_fraction | 0.00244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.671 |\n", "| explained_variance | 0.9595897 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.97 |\n", "| n_updates | 3560 |\n", "| policy_gradient_loss | -0.000684 |\n", "| value_loss | 41.1 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 410 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 892 |\n", "| time_elapsed | 1592 |\n", "| total_timesteps | 913408 |\n", "| train/ | |\n", "| approx_kl | 0.0012369531 |\n", "| clip_fraction | 0.00146 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.723 |\n", "| explained_variance | 0.6069588 |\n", "| learning_rate | 0.0003 |\n", "| loss | 362 |\n", "| n_updates | 3564 |\n", "| policy_gradient_loss | -0.00162 |\n", "| value_loss | 634 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 410 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 893 |\n", "| time_elapsed | 1594 |\n", "| total_timesteps | 914432 |\n", "| train/ | |\n", "| approx_kl | 0.0008263005 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.644 |\n", "| explained_variance | 0.9673849 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.35 |\n", "| n_updates | 3568 |\n", "| policy_gradient_loss | -0.000245 |\n", "| value_loss | 23.9 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 409 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 894 |\n", "| time_elapsed | 1595 |\n", "| total_timesteps | 915456 |\n", "| train/ | |\n", "| approx_kl | 0.0032144957 |\n", "| clip_fraction | 0.0322 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.801 |\n", "| explained_variance | 0.9862846 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.95 |\n", "| n_updates | 3572 |\n", "| policy_gradient_loss | -0.00323 |\n", "| value_loss | 7.74 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 408 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 895 |\n", "| time_elapsed | 1597 |\n", "| total_timesteps | 916480 |\n", "| train/ | |\n", "| approx_kl | 0.0076351035 |\n", "| clip_fraction | 0.0483 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.754 |\n", "| explained_variance | 0.9543234 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.96 |\n", "| n_updates | 3576 |\n", "| policy_gradient_loss | -0.00216 |\n", "| value_loss | 20.4 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 400 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 896 |\n", "| time_elapsed | 1599 |\n", "| total_timesteps | 917504 |\n", "| train/ | |\n", "| approx_kl | 0.002502129 |\n", "| clip_fraction | 0.0144 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.654 |\n", "| explained_variance | 0.9595576 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.55 |\n", "| n_updates | 3580 |\n", "| policy_gradient_loss | -0.000574 |\n", "| value_loss | 26.8 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 399 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 897 |\n", "| time_elapsed | 1601 |\n", "| total_timesteps | 918528 |\n", "| train/ | |\n", "| approx_kl | 0.004939488 |\n", "| clip_fraction | 0.0186 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.724 |\n", "| explained_variance | 0.9651925 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.16 |\n", "| n_updates | 3584 |\n", "| policy_gradient_loss | -0.000394 |\n", "| value_loss | 18.3 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 398 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 898 |\n", "| time_elapsed | 1602 |\n", "| total_timesteps | 919552 |\n", "| train/ | |\n", "| approx_kl | 0.007160233 |\n", "| clip_fraction | 0.0386 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.712 |\n", "| explained_variance | 0.9878967 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.39 |\n", "| n_updates | 3588 |\n", "| policy_gradient_loss | -0.00157 |\n", "| value_loss | 6.97 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 399 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 899 |\n", "| time_elapsed | 1604 |\n", "| total_timesteps | 920576 |\n", "| train/ | |\n", "| approx_kl | 0.0083335545 |\n", "| clip_fraction | 0.0647 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.774 |\n", "| explained_variance | 0.9869501 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.37 |\n", "| n_updates | 3592 |\n", "| policy_gradient_loss | -0.00117 |\n", "| value_loss | 7.58 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 397 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 900 |\n", "| time_elapsed | 1606 |\n", "| total_timesteps | 921600 |\n", "| train/ | |\n", "| approx_kl | 0.009418115 |\n", "| clip_fraction | 0.11 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.672 |\n", "| explained_variance | 0.5288789 |\n", "| learning_rate | 0.0003 |\n", "| loss | 117 |\n", "| n_updates | 3596 |\n", "| policy_gradient_loss | -0.00178 |\n", "| value_loss | 926 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 397 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 901 |\n", "| time_elapsed | 1607 |\n", "| total_timesteps | 922624 |\n", "| train/ | |\n", "| approx_kl | 0.0065078842 |\n", "| clip_fraction | 0.0698 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.737 |\n", "| explained_variance | 0.97894824 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.98 |\n", "| n_updates | 3600 |\n", "| policy_gradient_loss | -0.00639 |\n", "| value_loss | 15.7 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 396 |\n", "| ep_rew_mean | 217 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 902 |\n", "| time_elapsed | 1610 |\n", "| total_timesteps | 923648 |\n", "| train/ | |\n", "| approx_kl | 0.0036689015 |\n", "| clip_fraction | 0.0332 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.68 |\n", "| explained_variance | 0.9876458 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.03 |\n", "| n_updates | 3604 |\n", "| policy_gradient_loss | -0.00133 |\n", "| value_loss | 7.58 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 393 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 903 |\n", "| time_elapsed | 1611 |\n", "| total_timesteps | 924672 |\n", "| train/ | |\n", "| approx_kl | 0.004814436 |\n", "| clip_fraction | 0.0332 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.76 |\n", "| explained_variance | 0.9904206 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.49 |\n", "| n_updates | 3608 |\n", "| policy_gradient_loss | 0.000294 |\n", "| value_loss | 5.36 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 392 |\n", "| ep_rew_mean | 212 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 904 |\n", "| time_elapsed | 1613 |\n", "| total_timesteps | 925696 |\n", "| train/ | |\n", "| approx_kl | 0.004355767 |\n", "| clip_fraction | 0.04 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.736 |\n", "| explained_variance | 0.48434228 |\n", "| learning_rate | 0.0003 |\n", "| loss | 883 |\n", "| n_updates | 3612 |\n", "| policy_gradient_loss | 9.95e-05 |\n", "| value_loss | 1.91e+03 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 390 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 905 |\n", "| time_elapsed | 1615 |\n", "| total_timesteps | 926720 |\n", "| train/ | |\n", "| approx_kl | 0.0034587334 |\n", "| clip_fraction | 0.0137 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.703 |\n", "| explained_variance | 0.971204 |\n", "| learning_rate | 0.0003 |\n", "| loss | 6.92 |\n", "| n_updates | 3616 |\n", "| policy_gradient_loss | -0.00394 |\n", "| value_loss | 16.9 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 390 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 906 |\n", "| time_elapsed | 1616 |\n", "| total_timesteps | 927744 |\n", "| train/ | |\n", "| approx_kl | 0.0018663397 |\n", "| clip_fraction | 0.000977 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.7 |\n", "| explained_variance | 0.67144084 |\n", "| learning_rate | 0.0003 |\n", "| loss | 119 |\n", "| n_updates | 3620 |\n", "| policy_gradient_loss | -0.00366 |\n", "| value_loss | 634 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 389 |\n", "| ep_rew_mean | 213 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 907 |\n", "| time_elapsed | 1618 |\n", "| total_timesteps | 928768 |\n", "| train/ | |\n", "| approx_kl | 0.0014073197 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.79 |\n", "| explained_variance | 0.59385705 |\n", "| learning_rate | 0.0003 |\n", "| loss | 213 |\n", "| n_updates | 3624 |\n", "| policy_gradient_loss | -0.00255 |\n", "| value_loss | 845 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 389 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 908 |\n", "| time_elapsed | 1620 |\n", "| total_timesteps | 929792 |\n", "| train/ | |\n", "| approx_kl | 0.005460643 |\n", "| clip_fraction | 0.0352 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.818 |\n", "| explained_variance | 0.9594423 |\n", "| learning_rate | 0.0003 |\n", "| loss | 3.45 |\n", "| n_updates | 3628 |\n", "| policy_gradient_loss | -0.00252 |\n", "| value_loss | 19 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 388 |\n", "| ep_rew_mean | 214 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 909 |\n", "| time_elapsed | 1622 |\n", "| total_timesteps | 930816 |\n", "| train/ | |\n", "| approx_kl | 0.0026274282 |\n", "| clip_fraction | 0.0225 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.601 |\n", "| explained_variance | 0.8990368 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.97 |\n", "| n_updates | 3632 |\n", "| policy_gradient_loss | -0.00373 |\n", "| value_loss | 19.6 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 382 |\n", "| ep_rew_mean | 211 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 910 |\n", "| time_elapsed | 1624 |\n", "| total_timesteps | 931840 |\n", "| train/ | |\n", "| approx_kl | 0.0045581777 |\n", "| clip_fraction | 0.04 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.723 |\n", "| explained_variance | 0.978967 |\n", "| learning_rate | 0.0003 |\n", "| loss | 2.55 |\n", "| n_updates | 3636 |\n", "| policy_gradient_loss | -0.00251 |\n", "| value_loss | 10.9 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 380 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 911 |\n", "| time_elapsed | 1625 |\n", "| total_timesteps | 932864 |\n", "| train/ | |\n", "| approx_kl | 0.000404727 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.765 |\n", "| explained_variance | 0.55538464 |\n", "| learning_rate | 0.0003 |\n", "| loss | 265 |\n", "| n_updates | 3640 |\n", "| policy_gradient_loss | 0.000783 |\n", "| value_loss | 925 |\n", "-----------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 382 |\n", "| ep_rew_mean | 207 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 912 |\n", "| time_elapsed | 1627 |\n", "| total_timesteps | 933888 |\n", "| train/ | |\n", "| approx_kl | 1.1228723e-05 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.784 |\n", "| explained_variance | 0.5674583 |\n", "| learning_rate | 0.0003 |\n", "| loss | 680 |\n", "| n_updates | 3644 |\n", "| policy_gradient_loss | -8.59e-05 |\n", "| value_loss | 1.46e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 382 |\n", "| ep_rew_mean | 210 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 913 |\n", "| time_elapsed | 1629 |\n", "| total_timesteps | 934912 |\n", "| train/ | |\n", "| approx_kl | 0.0018602532 |\n", "| clip_fraction | 0.00366 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.645 |\n", "| explained_variance | 0.9404254 |\n", "| learning_rate | 0.0003 |\n", "| loss | 5.16 |\n", "| n_updates | 3648 |\n", "| policy_gradient_loss | -0.00126 |\n", "| value_loss | 49.5 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 381 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 914 |\n", "| time_elapsed | 1630 |\n", "| total_timesteps | 935936 |\n", "| train/ | |\n", "| approx_kl | 0.0052797575 |\n", "| clip_fraction | 0.031 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.717 |\n", "| explained_variance | 0.92424154 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.45 |\n", "| n_updates | 3652 |\n", "| policy_gradient_loss | -0.0035 |\n", "| value_loss | 27.3 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 375 |\n", "| ep_rew_mean | 209 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 915 |\n", "| time_elapsed | 1632 |\n", "| total_timesteps | 936960 |\n", "| train/ | |\n", "| approx_kl | 0.0069291773 |\n", "| clip_fraction | 0.115 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.782 |\n", "| explained_variance | 0.4600755 |\n", "| learning_rate | 0.0003 |\n", "| loss | 296 |\n", "| n_updates | 3656 |\n", "| policy_gradient_loss | 0.00148 |\n", "| value_loss | 940 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 372 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 916 |\n", "| time_elapsed | 1634 |\n", "| total_timesteps | 937984 |\n", "| train/ | |\n", "| approx_kl | 0.006445364 |\n", "| clip_fraction | 0.0493 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.772 |\n", "| explained_variance | 0.9778672 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.8 |\n", "| n_updates | 3660 |\n", "| policy_gradient_loss | -0.00386 |\n", "| value_loss | 16.6 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 371 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 917 |\n", "| time_elapsed | 1636 |\n", "| total_timesteps | 939008 |\n", "| train/ | |\n", "| approx_kl | 0.0018803207 |\n", "| clip_fraction | 0.0139 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.758 |\n", "| explained_variance | 0.4758013 |\n", "| learning_rate | 0.0003 |\n", "| loss | 251 |\n", "| n_updates | 3664 |\n", "| policy_gradient_loss | 0.000672 |\n", "| value_loss | 1.38e+03 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 378 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 918 |\n", "| time_elapsed | 1638 |\n", "| total_timesteps | 940032 |\n", "| train/ | |\n", "| approx_kl | 0.0002184799 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.725 |\n", "| explained_variance | 0.7346723 |\n", "| learning_rate | 0.0003 |\n", "| loss | 130 |\n", "| n_updates | 3668 |\n", "| policy_gradient_loss | -0.000365 |\n", "| value_loss | 598 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 376 |\n", "| ep_rew_mean | 208 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 919 |\n", "| time_elapsed | 1639 |\n", "| total_timesteps | 941056 |\n", "| train/ | |\n", "| approx_kl | 0.0007230598 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.752 |\n", "| explained_variance | 0.7070824 |\n", "| learning_rate | 0.0003 |\n", "| loss | 48.5 |\n", "| n_updates | 3672 |\n", "| policy_gradient_loss | -0.000889 |\n", "| value_loss | 825 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 376 |\n", "| ep_rew_mean | 206 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 920 |\n", "| time_elapsed | 1641 |\n", "| total_timesteps | 942080 |\n", "| train/ | |\n", "| approx_kl | 0.0025974447 |\n", "| clip_fraction | 0.0115 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.713 |\n", "| explained_variance | 0.9591151 |\n", "| learning_rate | 0.0003 |\n", "| loss | 4.42 |\n", "| n_updates | 3676 |\n", "| policy_gradient_loss | -0.00199 |\n", "| value_loss | 31.8 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 372 |\n", "| ep_rew_mean | 203 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 921 |\n", "| time_elapsed | 1643 |\n", "| total_timesteps | 943104 |\n", "| train/ | |\n", "| approx_kl | 0.00050113397 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.739 |\n", "| explained_variance | 0.7674358 |\n", "| learning_rate | 0.0003 |\n", "| loss | 89.1 |\n", "| n_updates | 3680 |\n", "| policy_gradient_loss | -0.000268 |\n", "| value_loss | 433 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 359 |\n", "| ep_rew_mean | 198 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 922 |\n", "| time_elapsed | 1645 |\n", "| total_timesteps | 944128 |\n", "| train/ | |\n", "| approx_kl | 0.0005919831 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.685 |\n", "| explained_variance | 0.83452344 |\n", "| learning_rate | 0.0003 |\n", "| loss | 164 |\n", "| n_updates | 3684 |\n", "| policy_gradient_loss | 5.41e-05 |\n", "| value_loss | 487 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 365 |\n", "| ep_rew_mean | 197 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 923 |\n", "| time_elapsed | 1647 |\n", "| total_timesteps | 945152 |\n", "| train/ | |\n", "| approx_kl | 0.00013846188 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.808 |\n", "| explained_variance | 0.76949006 |\n", "| learning_rate | 0.0003 |\n", "| loss | 447 |\n", "| n_updates | 3688 |\n", "| policy_gradient_loss | -0.000354 |\n", "| value_loss | 821 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 364 |\n", "| ep_rew_mean | 195 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 924 |\n", "| time_elapsed | 1648 |\n", "| total_timesteps | 946176 |\n", "| train/ | |\n", "| approx_kl | 0.006481627 |\n", "| clip_fraction | 0.0378 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.619 |\n", "| explained_variance | 0.9789374 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.3 |\n", "| n_updates | 3692 |\n", "| policy_gradient_loss | -0.00361 |\n", "| value_loss | 9.58 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 365 |\n", "| ep_rew_mean | 197 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 925 |\n", "| time_elapsed | 1650 |\n", "| total_timesteps | 947200 |\n", "| train/ | |\n", "| approx_kl | 0.017931039 |\n", "| clip_fraction | 0.196 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.781 |\n", "| explained_variance | 0.64106184 |\n", "| learning_rate | 0.0003 |\n", "| loss | 1.07e+03 |\n", "| n_updates | 3696 |\n", "| policy_gradient_loss | 0.00412 |\n", "| value_loss | 1.6e+03 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 372 |\n", "| ep_rew_mean | 196 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 926 |\n", "| time_elapsed | 1652 |\n", "| total_timesteps | 948224 |\n", "| train/ | |\n", "| approx_kl | 0.0013018582 |\n", "| clip_fraction | 0.000732 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.73 |\n", "| explained_variance | 0.8789992 |\n", "| learning_rate | 0.0003 |\n", "| loss | 39.6 |\n", "| n_updates | 3700 |\n", "| policy_gradient_loss | -0.00116 |\n", "| value_loss | 267 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 374 |\n", "| ep_rew_mean | 196 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 927 |\n", "| time_elapsed | 1653 |\n", "| total_timesteps | 949248 |\n", "| train/ | |\n", "| approx_kl | 0.00070313923 |\n", "| clip_fraction | 0.000244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.598 |\n", "| explained_variance | 0.85627604 |\n", "| learning_rate | 0.0003 |\n", "| loss | 22.2 |\n", "| n_updates | 3704 |\n", "| policy_gradient_loss | -0.00055 |\n", "| value_loss | 97.9 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 364 |\n", "| ep_rew_mean | 188 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 928 |\n", "| time_elapsed | 1655 |\n", "| total_timesteps | 950272 |\n", "| train/ | |\n", "| approx_kl | 0.0015090532 |\n", "| clip_fraction | 0.000488 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.664 |\n", "| explained_variance | 0.75784826 |\n", "| learning_rate | 0.0003 |\n", "| loss | 275 |\n", "| n_updates | 3708 |\n", "| policy_gradient_loss | -0.0017 |\n", "| value_loss | 685 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 362 |\n", "| ep_rew_mean | 186 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 929 |\n", "| time_elapsed | 1657 |\n", "| total_timesteps | 951296 |\n", "| train/ | |\n", "| approx_kl | 0.00019730307 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.864 |\n", "| explained_variance | 0.56364137 |\n", "| learning_rate | 0.0003 |\n", "| loss | 742 |\n", "| n_updates | 3712 |\n", "| policy_gradient_loss | -0.000451 |\n", "| value_loss | 1.96e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 363 |\n", "| ep_rew_mean | 184 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 930 |\n", "| time_elapsed | 1659 |\n", "| total_timesteps | 952320 |\n", "| train/ | |\n", "| approx_kl | 0.0017948615 |\n", "| clip_fraction | 0.000488 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.721 |\n", "| explained_variance | 0.6812679 |\n", "| learning_rate | 0.0003 |\n", "| loss | 209 |\n", "| n_updates | 3716 |\n", "| policy_gradient_loss | -0.00167 |\n", "| value_loss | 355 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 363 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 573 |\n", "| iterations | 931 |\n", "| time_elapsed | 1660 |\n", "| total_timesteps | 953344 |\n", "| train/ | |\n", "| approx_kl | 0.00047835434 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.712 |\n", "| explained_variance | 0.76666445 |\n", "| learning_rate | 0.0003 |\n", "| loss | 286 |\n", "| n_updates | 3720 |\n", "| policy_gradient_loss | -0.000666 |\n", "| value_loss | 554 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 369 |\n", "| ep_rew_mean | 181 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 932 |\n", "| time_elapsed | 1662 |\n", "| total_timesteps | 954368 |\n", "| train/ | |\n", "| approx_kl | 0.0015587942 |\n", "| clip_fraction | 0.00659 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.618 |\n", "| explained_variance | 0.48605847 |\n", "| learning_rate | 0.0003 |\n", "| loss | 195 |\n", "| n_updates | 3724 |\n", "| policy_gradient_loss | -0.0016 |\n", "| value_loss | 734 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 368 |\n", "| ep_rew_mean | 179 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 933 |\n", "| time_elapsed | 1664 |\n", "| total_timesteps | 955392 |\n", "| train/ | |\n", "| approx_kl | 0.00016462168 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.651 |\n", "| explained_variance | 0.6087233 |\n", "| learning_rate | 0.0003 |\n", "| loss | 56.7 |\n", "| n_updates | 3728 |\n", "| policy_gradient_loss | 4e-05 |\n", "| value_loss | 299 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 365 |\n", "| ep_rew_mean | 174 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 934 |\n", "| time_elapsed | 1665 |\n", "| total_timesteps | 956416 |\n", "| train/ | |\n", "| approx_kl | 0.0019175424 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.746 |\n", "| explained_variance | 0.64325887 |\n", "| learning_rate | 0.0003 |\n", "| loss | 163 |\n", "| n_updates | 3732 |\n", "| policy_gradient_loss | -0.00186 |\n", "| value_loss | 434 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 364 |\n", "| ep_rew_mean | 173 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 935 |\n", "| time_elapsed | 1667 |\n", "| total_timesteps | 957440 |\n", "| train/ | |\n", "| approx_kl | 0.00044753368 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.812 |\n", "| explained_variance | 0.7083135 |\n", "| learning_rate | 0.0003 |\n", "| loss | 509 |\n", "| n_updates | 3736 |\n", "| policy_gradient_loss | -0.000317 |\n", "| value_loss | 1.29e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 363 |\n", "| ep_rew_mean | 171 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 936 |\n", "| time_elapsed | 1669 |\n", "| total_timesteps | 958464 |\n", "| train/ | |\n", "| approx_kl | 0.0016002292 |\n", "| clip_fraction | 0.00269 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.794 |\n", "| explained_variance | 0.5478834 |\n", "| learning_rate | 0.0003 |\n", "| loss | 369 |\n", "| n_updates | 3740 |\n", "| policy_gradient_loss | -0.000635 |\n", "| value_loss | 836 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 362 |\n", "| ep_rew_mean | 170 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 937 |\n", "| time_elapsed | 1671 |\n", "| total_timesteps | 959488 |\n", "| train/ | |\n", "| approx_kl | 0.0005042678 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.769 |\n", "| explained_variance | -0.11804533 |\n", "| learning_rate | 0.0003 |\n", "| loss | 282 |\n", "| n_updates | 3744 |\n", "| policy_gradient_loss | -0.000857 |\n", "| value_loss | 807 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 362 |\n", "| ep_rew_mean | 171 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 938 |\n", "| time_elapsed | 1673 |\n", "| total_timesteps | 960512 |\n", "| train/ | |\n", "| approx_kl | 0.0023835849 |\n", "| clip_fraction | 0.00659 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.667 |\n", "| explained_variance | 0.5829898 |\n", "| learning_rate | 0.0003 |\n", "| loss | 46.5 |\n", "| n_updates | 3748 |\n", "| policy_gradient_loss | -0.00307 |\n", "| value_loss | 195 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 362 |\n", "| ep_rew_mean | 172 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 939 |\n", "| time_elapsed | 1674 |\n", "| total_timesteps | 961536 |\n", "| train/ | |\n", "| approx_kl | 0.0011906102 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.734 |\n", "| explained_variance | 0.3353035 |\n", "| learning_rate | 0.0003 |\n", "| loss | 414 |\n", "| n_updates | 3752 |\n", "| policy_gradient_loss | -0.000243 |\n", "| value_loss | 666 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 359 |\n", "| ep_rew_mean | 167 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 940 |\n", "| time_elapsed | 1676 |\n", "| total_timesteps | 962560 |\n", "| train/ | |\n", "| approx_kl | 0.001066558 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.713 |\n", "| explained_variance | 0.61485755 |\n", "| learning_rate | 0.0003 |\n", "| loss | 395 |\n", "| n_updates | 3756 |\n", "| policy_gradient_loss | -0.00089 |\n", "| value_loss | 507 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 356 |\n", "| ep_rew_mean | 163 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 941 |\n", "| time_elapsed | 1678 |\n", "| total_timesteps | 963584 |\n", "| train/ | |\n", "| approx_kl | 0.0016088514 |\n", "| clip_fraction | 0.000244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.815 |\n", "| explained_variance | 0.6164469 |\n", "| learning_rate | 0.0003 |\n", "| loss | 489 |\n", "| n_updates | 3760 |\n", "| policy_gradient_loss | -0.00238 |\n", "| value_loss | 1.04e+03 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 347 |\n", "| ep_rew_mean | 162 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 942 |\n", "| time_elapsed | 1680 |\n", "| total_timesteps | 964608 |\n", "| train/ | |\n", "| approx_kl | 0.00038261525 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.814 |\n", "| explained_variance | 0.7389965 |\n", "| learning_rate | 0.0003 |\n", "| loss | 220 |\n", "| n_updates | 3764 |\n", "| policy_gradient_loss | -0.000272 |\n", "| value_loss | 763 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 347 |\n", "| ep_rew_mean | 160 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 943 |\n", "| time_elapsed | 1682 |\n", "| total_timesteps | 965632 |\n", "| train/ | |\n", "| approx_kl | 0.00067269587 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.755 |\n", "| explained_variance | 0.6806197 |\n", "| learning_rate | 0.0003 |\n", "| loss | 136 |\n", "| n_updates | 3768 |\n", "| policy_gradient_loss | -0.000891 |\n", "| value_loss | 483 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 347 |\n", "| ep_rew_mean | 160 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 944 |\n", "| time_elapsed | 1683 |\n", "| total_timesteps | 966656 |\n", "| train/ | |\n", "| approx_kl | 0.00043768832 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.708 |\n", "| explained_variance | 0.7035491 |\n", "| learning_rate | 0.0003 |\n", "| loss | 241 |\n", "| n_updates | 3772 |\n", "| policy_gradient_loss | -0.000849 |\n", "| value_loss | 461 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 348 |\n", "| ep_rew_mean | 165 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 945 |\n", "| time_elapsed | 1685 |\n", "| total_timesteps | 967680 |\n", "| train/ | |\n", "| approx_kl | 0.0007155647 |\n", "| clip_fraction | 0.000488 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.702 |\n", "| explained_variance | 0.54920614 |\n", "| learning_rate | 0.0003 |\n", "| loss | 120 |\n", "| n_updates | 3776 |\n", "| policy_gradient_loss | -0.000387 |\n", "| value_loss | 600 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 344 |\n", "| ep_rew_mean | 160 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 946 |\n", "| time_elapsed | 1687 |\n", "| total_timesteps | 968704 |\n", "| train/ | |\n", "| approx_kl | 0.004915016 |\n", "| clip_fraction | 0.0188 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.745 |\n", "| explained_variance | 0.8385835 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.9 |\n", "| n_updates | 3780 |\n", "| policy_gradient_loss | -0.00155 |\n", "| value_loss | 82.4 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 343 |\n", "| ep_rew_mean | 156 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 947 |\n", "| time_elapsed | 1688 |\n", "| total_timesteps | 969728 |\n", "| train/ | |\n", "| approx_kl | 0.0005995464 |\n", "| clip_fraction | 0.000244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.719 |\n", "| explained_variance | 0.32498848 |\n", "| learning_rate | 0.0003 |\n", "| loss | 551 |\n", "| n_updates | 3784 |\n", "| policy_gradient_loss | -0.000698 |\n", "| value_loss | 1.8e+03 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 340 |\n", "| ep_rew_mean | 154 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 948 |\n", "| time_elapsed | 1690 |\n", "| total_timesteps | 970752 |\n", "| train/ | |\n", "| approx_kl | 0.00050075527 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.794 |\n", "| explained_variance | 0.4664073 |\n", "| learning_rate | 0.0003 |\n", "| loss | 538 |\n", "| n_updates | 3788 |\n", "| policy_gradient_loss | -0.0012 |\n", "| value_loss | 1.07e+03 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 342 |\n", "| ep_rew_mean | 158 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 949 |\n", "| time_elapsed | 1692 |\n", "| total_timesteps | 971776 |\n", "| train/ | |\n", "| approx_kl | 0.00011092465 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.759 |\n", "| explained_variance | 0.5170304 |\n", "| learning_rate | 0.0003 |\n", "| loss | 437 |\n", "| n_updates | 3792 |\n", "| policy_gradient_loss | -0.000128 |\n", "| value_loss | 1.15e+03 |\n", "-------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 341 |\n", "| ep_rew_mean | 158 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 950 |\n", "| time_elapsed | 1694 |\n", "| total_timesteps | 972800 |\n", "| train/ | |\n", "| approx_kl | 0.00037158508 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.658 |\n", "| explained_variance | 0.6244669 |\n", "| learning_rate | 0.0003 |\n", "| loss | 42.8 |\n", "| n_updates | 3796 |\n", "| policy_gradient_loss | -2.36e-05 |\n", "| value_loss | 214 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 335 |\n", "| ep_rew_mean | 161 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 951 |\n", "| time_elapsed | 1696 |\n", "| total_timesteps | 973824 |\n", "| train/ | |\n", "| approx_kl | 0.0008543365 |\n", "| clip_fraction | 0.000244 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.688 |\n", "| explained_variance | 0.59470785 |\n", "| learning_rate | 0.0003 |\n", "| loss | 92.2 |\n", "| n_updates | 3800 |\n", "| policy_gradient_loss | -0.00131 |\n", "| value_loss | 559 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 336 |\n", "| ep_rew_mean | 161 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 952 |\n", "| time_elapsed | 1697 |\n", "| total_timesteps | 974848 |\n", "| train/ | |\n", "| approx_kl | 0.0042348113 |\n", "| clip_fraction | 0.0361 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.733 |\n", "| explained_variance | 0.65124595 |\n", "| learning_rate | 0.0003 |\n", "| loss | 39.7 |\n", "| n_updates | 3804 |\n", "| policy_gradient_loss | -0.00361 |\n", "| value_loss | 136 |\n", "------------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 341 |\n", "| ep_rew_mean | 161 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 953 |\n", "| time_elapsed | 1699 |\n", "| total_timesteps | 975872 |\n", "| train/ | |\n", "| approx_kl | 0.00395691 |\n", "| clip_fraction | 0.0239 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.678 |\n", "| explained_variance | 0.92574924 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.64 |\n", "| n_updates | 3808 |\n", "| policy_gradient_loss | -0.00209 |\n", "| value_loss | 43.8 |\n", "----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 340 |\n", "| ep_rew_mean | 161 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 954 |\n", "| time_elapsed | 1701 |\n", "| total_timesteps | 976896 |\n", "| train/ | |\n", "| approx_kl | 0.0008127556 |\n", "| clip_fraction | 0.0239 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.71 |\n", "| explained_variance | 0.6488405 |\n", "| learning_rate | 0.0003 |\n", "| loss | 254 |\n", "| n_updates | 3812 |\n", "| policy_gradient_loss | 0.000521 |\n", "| value_loss | 580 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 342 |\n", "| ep_rew_mean | 168 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 955 |\n", "| time_elapsed | 1703 |\n", "| total_timesteps | 977920 |\n", "| train/ | |\n", "| approx_kl | 0.0027752307 |\n", "| clip_fraction | 0.00195 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.68 |\n", "| explained_variance | 0.7177346 |\n", "| learning_rate | 0.0003 |\n", "| loss | 31 |\n", "| n_updates | 3816 |\n", "| policy_gradient_loss | -0.000946 |\n", "| value_loss | 181 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 336 |\n", "| ep_rew_mean | 169 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 956 |\n", "| time_elapsed | 1705 |\n", "| total_timesteps | 978944 |\n", "| train/ | |\n", "| approx_kl | 0.0054516997 |\n", "| clip_fraction | 0.0193 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.728 |\n", "| explained_variance | 0.6541332 |\n", "| learning_rate | 0.0003 |\n", "| loss | 20 |\n", "| n_updates | 3820 |\n", "| policy_gradient_loss | -0.0018 |\n", "| value_loss | 87.9 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 339 |\n", "| ep_rew_mean | 176 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 957 |\n", "| time_elapsed | 1707 |\n", "| total_timesteps | 979968 |\n", "| train/ | |\n", "| approx_kl | 0.0010803475 |\n", "| clip_fraction | 0.000977 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.729 |\n", "| explained_variance | 0.6072459 |\n", "| learning_rate | 0.0003 |\n", "| loss | 455 |\n", "| n_updates | 3824 |\n", "| policy_gradient_loss | 0.00105 |\n", "| value_loss | 739 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 332 |\n", "| ep_rew_mean | 177 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 958 |\n", "| time_elapsed | 1708 |\n", "| total_timesteps | 980992 |\n", "| train/ | |\n", "| approx_kl | 0.00021313265 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.741 |\n", "| explained_variance | 0.568452 |\n", "| learning_rate | 0.0003 |\n", "| loss | 31.7 |\n", "| n_updates | 3828 |\n", "| policy_gradient_loss | 0.000182 |\n", "| value_loss | 196 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 325 |\n", "| ep_rew_mean | 175 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 959 |\n", "| time_elapsed | 1710 |\n", "| total_timesteps | 982016 |\n", "| train/ | |\n", "| approx_kl | 0.0034031942 |\n", "| clip_fraction | 0.0115 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.77 |\n", "| explained_variance | 0.72318256 |\n", "| learning_rate | 0.0003 |\n", "| loss | 45.9 |\n", "| n_updates | 3832 |\n", "| policy_gradient_loss | -0.00108 |\n", "| value_loss | 484 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 328 |\n", "| ep_rew_mean | 179 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 960 |\n", "| time_elapsed | 1712 |\n", "| total_timesteps | 983040 |\n", "| train/ | |\n", "| approx_kl | 0.00041980232 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.784 |\n", "| explained_variance | 0.6822001 |\n", "| learning_rate | 0.0003 |\n", "| loss | 936 |\n", "| n_updates | 3836 |\n", "| policy_gradient_loss | -0.00035 |\n", "| value_loss | 1.33e+03 |\n", "-------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 333 |\n", "| ep_rew_mean | 181 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 961 |\n", "| time_elapsed | 1713 |\n", "| total_timesteps | 984064 |\n", "| train/ | |\n", "| approx_kl | 0.003771958 |\n", "| clip_fraction | 0.0122 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.72 |\n", "| explained_variance | 0.383628 |\n", "| learning_rate | 0.0003 |\n", "| loss | 89.3 |\n", "| n_updates | 3840 |\n", "| policy_gradient_loss | -0.00246 |\n", "| value_loss | 907 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 333 |\n", "| ep_rew_mean | 183 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 962 |\n", "| time_elapsed | 1715 |\n", "| total_timesteps | 985088 |\n", "| train/ | |\n", "| approx_kl | 0.0029577098 |\n", "| clip_fraction | 0.0322 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.659 |\n", "| explained_variance | 0.9558869 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11.8 |\n", "| n_updates | 3844 |\n", "| policy_gradient_loss | -0.00193 |\n", "| value_loss | 43.7 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 334 |\n", "| ep_rew_mean | 185 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 963 |\n", "| time_elapsed | 1717 |\n", "| total_timesteps | 986112 |\n", "| train/ | |\n", "| approx_kl | 0.0060834624 |\n", "| clip_fraction | 0.0298 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.676 |\n", "| explained_variance | 0.78245705 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.1 |\n", "| n_updates | 3848 |\n", "| policy_gradient_loss | -0.00367 |\n", "| value_loss | 109 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 325 |\n", "| ep_rew_mean | 182 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 964 |\n", "| time_elapsed | 1719 |\n", "| total_timesteps | 987136 |\n", "| train/ | |\n", "| approx_kl | 0.009996594 |\n", "| clip_fraction | 0.0366 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.694 |\n", "| explained_variance | 0.8424798 |\n", "| learning_rate | 0.0003 |\n", "| loss | 9.92 |\n", "| n_updates | 3852 |\n", "| policy_gradient_loss | -0.000621 |\n", "| value_loss | 50.4 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 335 |\n", "| ep_rew_mean | 181 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 965 |\n", "| time_elapsed | 1721 |\n", "| total_timesteps | 988160 |\n", "| train/ | |\n", "| approx_kl | 0.004928575 |\n", "| clip_fraction | 0.114 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.745 |\n", "| explained_variance | 0.2651494 |\n", "| learning_rate | 0.0003 |\n", "| loss | 513 |\n", "| n_updates | 3856 |\n", "| policy_gradient_loss | 0.00203 |\n", "| value_loss | 1.52e+03 |\n", "-----------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 336 |\n", "| ep_rew_mean | 183 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 966 |\n", "| time_elapsed | 1722 |\n", "| total_timesteps | 989184 |\n", "| train/ | |\n", "| approx_kl | 0.005871132 |\n", "| clip_fraction | 0.0454 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.728 |\n", "| explained_variance | 0.9754874 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.5 |\n", "| n_updates | 3860 |\n", "| policy_gradient_loss | -0.00215 |\n", "| value_loss | 26.2 |\n", "-----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 338 |\n", "| ep_rew_mean | 187 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 967 |\n", "| time_elapsed | 1724 |\n", "| total_timesteps | 990208 |\n", "| train/ | |\n", "| approx_kl | 0.0032056416 |\n", "| clip_fraction | 0.0127 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.688 |\n", "| explained_variance | 0.95287293 |\n", "| learning_rate | 0.0003 |\n", "| loss | 7.92 |\n", "| n_updates | 3864 |\n", "| policy_gradient_loss | 0.000475 |\n", "| value_loss | 24.7 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 344 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 968 |\n", "| time_elapsed | 1726 |\n", "| total_timesteps | 991232 |\n", "| train/ | |\n", "| approx_kl | 0.0040416047 |\n", "| clip_fraction | 0.0349 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.684 |\n", "| explained_variance | 0.9252282 |\n", "| learning_rate | 0.0003 |\n", "| loss | 15.9 |\n", "| n_updates | 3868 |\n", "| policy_gradient_loss | -0.000196 |\n", "| value_loss | 42.4 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 343 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 969 |\n", "| time_elapsed | 1728 |\n", "| total_timesteps | 992256 |\n", "| train/ | |\n", "| approx_kl | 0.0036541708 |\n", "| clip_fraction | 0.0391 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.611 |\n", "| explained_variance | 0.97556317 |\n", "| learning_rate | 0.0003 |\n", "| loss | 11 |\n", "| n_updates | 3872 |\n", "| policy_gradient_loss | -0.00328 |\n", "| value_loss | 27.4 |\n", "------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 345 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 970 |\n", "| time_elapsed | 1730 |\n", "| total_timesteps | 993280 |\n", "| train/ | |\n", "| approx_kl | 0.0030540614 |\n", "| clip_fraction | 0.0256 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.77 |\n", "| explained_variance | 0.44396192 |\n", "| learning_rate | 0.0003 |\n", "| loss | 292 |\n", "| n_updates | 3876 |\n", "| policy_gradient_loss | -0.00294 |\n", "| value_loss | 1.02e+03 |\n", "------------------------------------------\n", "-----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 343 |\n", "| ep_rew_mean | 189 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 971 |\n", "| time_elapsed | 1731 |\n", "| total_timesteps | 994304 |\n", "| train/ | |\n", "| approx_kl | 0.004856142 |\n", "| clip_fraction | 0.0388 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.659 |\n", "| explained_variance | 0.9320221 |\n", "| learning_rate | 0.0003 |\n", "| loss | 10.2 |\n", "| n_updates | 3880 |\n", "| policy_gradient_loss | -0.00555 |\n", "| value_loss | 42.8 |\n", "-----------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 342 |\n", "| ep_rew_mean | 189 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 972 |\n", "| time_elapsed | 1733 |\n", "| total_timesteps | 995328 |\n", "| train/ | |\n", "| approx_kl | 0.00572942 |\n", "| clip_fraction | 0.0759 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.707 |\n", "| explained_variance | 0.7027645 |\n", "| learning_rate | 0.0003 |\n", "| loss | 607 |\n", "| n_updates | 3884 |\n", "| policy_gradient_loss | -0.00442 |\n", "| value_loss | 632 |\n", "----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 341 |\n", "| ep_rew_mean | 188 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 973 |\n", "| time_elapsed | 1735 |\n", "| total_timesteps | 996352 |\n", "| train/ | |\n", "| approx_kl | 0.0061508454 |\n", "| clip_fraction | 0.0276 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.793 |\n", "| explained_variance | 0.56833816 |\n", "| learning_rate | 0.0003 |\n", "| loss | 243 |\n", "| n_updates | 3888 |\n", "| policy_gradient_loss | -0.00239 |\n", "| value_loss | 839 |\n", "------------------------------------------\n", "-------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 344 |\n", "| ep_rew_mean | 192 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 974 |\n", "| time_elapsed | 1736 |\n", "| total_timesteps | 997376 |\n", "| train/ | |\n", "| approx_kl | 0.00078091223 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.794 |\n", "| explained_variance | 0.5936359 |\n", "| learning_rate | 0.0003 |\n", "| loss | 940 |\n", "| n_updates | 3892 |\n", "| policy_gradient_loss | -0.00137 |\n", "| value_loss | 1.6e+03 |\n", "-------------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 344 |\n", "| ep_rew_mean | 190 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 975 |\n", "| time_elapsed | 1738 |\n", "| total_timesteps | 998400 |\n", "| train/ | |\n", "| approx_kl | 0.0013776363 |\n", "| clip_fraction | 0.00195 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.752 |\n", "| explained_variance | 0.7074866 |\n", "| learning_rate | 0.0003 |\n", "| loss | 258 |\n", "| n_updates | 3896 |\n", "| policy_gradient_loss | -0.00179 |\n", "| value_loss | 420 |\n", "------------------------------------------\n", "----------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 345 |\n", "| ep_rew_mean | 189 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 976 |\n", "| time_elapsed | 1740 |\n", "| total_timesteps | 999424 |\n", "| train/ | |\n", "| approx_kl | 0.00030336 |\n", "| clip_fraction | 0 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.832 |\n", "| explained_variance | 0.695728 |\n", "| learning_rate | 0.0003 |\n", "| loss | 437 |\n", "| n_updates | 3900 |\n", "| policy_gradient_loss | -0.000441 |\n", "| value_loss | 1.49e+03 |\n", "----------------------------------------\n", "------------------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 344 |\n", "| ep_rew_mean | 191 |\n", "| time/ | |\n", "| fps | 574 |\n", "| iterations | 977 |\n", "| time_elapsed | 1742 |\n", "| total_timesteps | 1000448 |\n", "| train/ | |\n", "| approx_kl | 0.0028918108 |\n", "| clip_fraction | 0.0083 |\n", "| clip_range | 0.2 |\n", "| entropy_loss | -0.721 |\n", "| explained_variance | 0.84710467 |\n", "| learning_rate | 0.0003 |\n", "| loss | 97.8 |\n", "| n_updates | 3904 |\n", "| policy_gradient_loss | -0.00117 |\n", "| value_loss | 274 |\n", "------------------------------------------\n" ] } ] }, { "cell_type": "code", "source": [ "notebook_login()\n", "!git config --global credential.helper store" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 17, "referenced_widgets": [ "5e5f6d0bae264cb492b6dda56e53e074", "eebf76576b7b4b719ac57de36e66382b", "a1d0a8cf6fe54df887f65436d8935269", "10366c39d49b4e6cb3d44166590352fc", "145ed8fecddf49fe8f8f283d2d8ddab9", "96010313880644fa9b6293e41a150e5f", "bddcd0e0941f488fbb0d98ac264cb72a", "4e0e83a476a840fcb4c334efcd961a7a", "a17b3df99ee941ad838e1ed455663f54", "8e317e1fb21c46debc662b461e84c912", "1c304f3e820e4b899f5349181570ed6e", "19ca5e456206449796b620ee5ec7f9fd", "0bed7d5da23c4fcbb2ef5e663ecfaeb6", "861c2d5a72d34afab4e01ee72d6b23dc", "a25f6653fc0c4d599e16e8ad207e0884", "bbcc61b64eed4d2ea96e679ed66675af", "6f78af7746864b40a1531f35e0e3ac11", "bad0550de5fc4c46acbae99e23dc164a", "3df1ff9d97f141b0920407e52c698947", "3e5cea3b91364b98bc36cb0e7c257043" ] }, "id": "vug50fNKxnCg", "outputId": "6b49b1c7-965b-4e80-ba60-6920e38b595c" }, "execution_count": 9, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "VBox(children=(HTML(value='