Buckets:

rtrm's picture
download
raw
30.6 kB
<meta charset="utf-8" /><meta name="hf:doc:metadata" content="{&quot;title&quot;:&quot;Welcome to the 🤗 Deep Reinforcement Learning Course&quot;,&quot;local&quot;:&quot;introduction&quot;,&quot;sections&quot;:[{&quot;title&quot;:&quot;What to expect?&quot;,&quot;local&quot;:&quot;expect&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What does the course look like?&quot;,&quot;local&quot;:&quot;course-look-like&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What’s the syllabus?&quot;,&quot;local&quot;:&quot;syllabus&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;Two paths: choose your own adventure&quot;,&quot;local&quot;:&quot;two-paths&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;The Certification Process&quot;,&quot;local&quot;:&quot;certification-process&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;How to get most of the course?&quot;,&quot;local&quot;:&quot;advice&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What tools do I need?&quot;,&quot;local&quot;:&quot;tools&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What is the recommended pace?&quot;,&quot;local&quot;:&quot;recommended-pace&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;Who are we&quot;,&quot;local&quot;:&quot;who-are-we&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What are the challenges in this course?&quot;,&quot;local&quot;:&quot;challenges&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;I found a bug, or I want to improve the course&quot;,&quot;local&quot;:&quot;contribute&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;I still have questions&quot;,&quot;local&quot;:&quot;questions&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2}],&quot;depth&quot;:1}">
<link href="/docs/deep-rl-course/pr_587/en/_app/immutable/assets/0.e3b0c442.css" rel="stylesheet">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/entry/start.7c4c7929.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/scheduler.37c15a92.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/singletons.945d9b5d.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/index.18351ede.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/paths.9ffa1e06.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/entry/app.d2a43a08.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/index.7cb9c9b8.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/nodes/0.e67798fa.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/each.e59479a4.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/nodes/6.b0856558.js">
<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/EditOnGithub.858acfec.js"><!-- HEAD_svelte-u9bgzb_START --><meta name="hf:doc:metadata" content="{&quot;title&quot;:&quot;Welcome to the 🤗 Deep Reinforcement Learning Course&quot;,&quot;local&quot;:&quot;introduction&quot;,&quot;sections&quot;:[{&quot;title&quot;:&quot;What to expect?&quot;,&quot;local&quot;:&quot;expect&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What does the course look like?&quot;,&quot;local&quot;:&quot;course-look-like&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What’s the syllabus?&quot;,&quot;local&quot;:&quot;syllabus&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;Two paths: choose your own adventure&quot;,&quot;local&quot;:&quot;two-paths&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;The Certification Process&quot;,&quot;local&quot;:&quot;certification-process&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;How to get most of the course?&quot;,&quot;local&quot;:&quot;advice&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What tools do I need?&quot;,&quot;local&quot;:&quot;tools&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What is the recommended pace?&quot;,&quot;local&quot;:&quot;recommended-pace&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;Who are we&quot;,&quot;local&quot;:&quot;who-are-we&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What are the challenges in this course?&quot;,&quot;local&quot;:&quot;challenges&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;I found a bug, or I want to improve the course&quot;,&quot;local&quot;:&quot;contribute&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;I still have 
questions&quot;,&quot;local&quot;:&quot;questions&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2}],&quot;depth&quot;:1}"><!-- HEAD_svelte-u9bgzb_END --> <p></p> <h1 class="relative group"><a id="introduction" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#introduction"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>Welcome to the 🤗 Deep Reinforcement Learning Course</span></h1> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/thumbnail.jpg" alt="Deep RL Course thumbnail" width="100%"> <p data-svelte-h="svelte-lar89z">Welcome to the most fascinating topic in Artificial Intelligence: <strong>Deep Reinforcement Learning</strong>.</p> <p data-svelte-h="svelte-9h5dhu">This course will <strong>teach you about Deep Reinforcement Learning from beginner to expert</strong>. 
It’s completely free and open-source!</p> <p data-svelte-h="svelte-q5r4ab">In this introduction unit you’ll:</p> <ul data-svelte-h="svelte-iulplw"><li>Learn more about the <strong>course content</strong>.</li> <li><strong>Define the path</strong> you’re going to take (either self-audit or certification process).</li> <li>Learn more about the <strong>AI vs. AI challenges</strong> you’re going to participate in.</li> <li>Learn more <strong>about us</strong>.</li> <li><strong>Create your Hugging Face account</strong> (it’s free).</li> <li><strong>Sign-up to our Discord server</strong>, the place where you can chat with your classmates and us (the Hugging Face team).</li></ul> <p data-svelte-h="svelte-4b3xjd">Let’s get started!</p> <h2 class="relative group"><a id="expect" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#expect"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What to expect?</span></h2> <p data-svelte-h="svelte-f2qxb3">In this course, you will:</p> <ul data-svelte-h="svelte-kd6znf"><li>📖 Study Deep Reinforcement Learning in <strong>theory and practice.</strong></li> <li>🧑‍💻 Learn to <strong>use famous Deep RL 
libraries</strong> such as <a href="https://stable-baselines3.readthedocs.io/en/master/" rel="nofollow">Stable Baselines3</a>, <a href="https://github.com/DLR-RM/rl-baselines3-zoo" rel="nofollow">RL Baselines3 Zoo</a>, <a href="https://samplefactory.dev/" rel="nofollow">Sample Factory</a> and <a href="https://github.com/vwxyzjn/cleanrl" rel="nofollow">CleanRL</a>.</li> <li>🤖 <strong>Train agents in unique environments</strong> such as <a href="https://huggingface.co/spaces/ThomasSimonini/SnowballFight" rel="nofollow">SnowballFight</a>, <a href="https://huggingface.co/spaces/ThomasSimonini/Huggy" rel="nofollow">Huggy the Doggo 🐶</a>, <a href="https://vizdoom.cs.put.edu.pl/" rel="nofollow">VizDoom (Doom)</a> and classical ones such as <a href="https://gymnasium.farama.org/environments/atari/space_invaders/" rel="nofollow">Space Invaders</a>, <a href="https://pybullet.org/wordpress/" rel="nofollow">PyBullet</a> and more.</li> <li>💾 Share your <strong>trained agents with one line of code to the Hub</strong> and also download powerful agents from the community.</li> <li>🏆 Participate in challenges where you will <strong>evaluate your agents against other teams. 
You’ll also get to play against the agents you’ll train.</strong></li> <li>🎓 <strong>Earn a certificate of completion</strong> by completing 80% of the assignments.</li></ul> <p data-svelte-h="svelte-t67g99">And more!</p> <p data-svelte-h="svelte-1xij83d">At the end of this course, <strong>you’ll get a solid foundation, from the basics to state-of-the-art (SOTA) methods</strong>.</p> <p data-svelte-h="svelte-i91mrq">Don’t forget to <strong><a href="https://eepurl.com/ic5ZUD">sign up for the course</a></strong> (we are collecting your email to be able to <strong>send you the links when each Unit is published and give you information about the challenges and updates).</strong></p> <p data-svelte-h="svelte-a79ye4">Sign up 👉 <a href="https://eepurl.com/ic5ZUD">here</a></p> <h2 class="relative group"><a id="course-look-like" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#course-look-like"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What does the course look like?</span></h2> <p data-svelte-h="svelte-1ee6w8b">The course is composed of:</p> <ul data-svelte-h="svelte-1ju8ahi"><li><p><em>A theory part</em>: where you learn a 
<strong>concept in theory</strong>.</p></li> <li><p><em>A hands-on</em>: where you’ll learn <strong>to use famous Deep RL libraries</strong> to train your agents in unique environments. These hands-on will be <strong>Google Colab notebooks with companion tutorial videos</strong> if you prefer learning with video format!</p></li> <li><p><em>Challenges</em>: you’ll get to put your agent to compete against other agents in different challenges. There will also be <a href="https://huggingface.co/spaces/huggingface-projects/Deep-Reinforcement-Learning-Leaderboard" rel="nofollow">a leaderboard</a> for you to compare the agents’ performance.</p></li></ul> <h2 class="relative group"><a id="syllabus" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#syllabus"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What’s the syllabus?</span></h2> <p data-svelte-h="svelte-oyiyj9">This is the course’s syllabus:</p> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/syllabus1.jpg" alt="Syllabus Part 1" width="100%"> <img 
src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/syllabus2.jpg" alt="Syllabus Part 2" width="100%"> <h2 class="relative group"><a id="two-paths" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#two-paths"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>Two paths: choose your own adventure</span></h2> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/two-paths.jpg" alt="Two paths" width="100%"> <p data-svelte-h="svelte-1ygf71c">You can choose to follow this course either:</p> <ul data-svelte-h="svelte-186gjk5"><li><em>To get a certificate of completion</em>: you need to complete 80% of the assignments.</li> <li><em>To get a certificate of honors</em>: you need to complete 100% of the assignments.</li> <li><em>As a simple audit</em>: you can participate in all challenges and do assignments if you want.</li></ul> <p data-svelte-h="svelte-1tfwr9k">There are <strong>no deadlines: the course is self-paced</strong>.
Both paths <strong>are completely free</strong>.
Whatever path you choose, we advise you <strong>to follow the recommended pace to enjoy the course and challenges with your fellow classmates.</strong></p> <p data-svelte-h="svelte-qy3r5p">You don’t need to tell us which path you choose. <strong>If you get at least 80% of the assignments done, you’ll get a certificate.</strong></p> <h2 class="relative group"><a id="certification-process" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#certification-process"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>The Certification Process</span></h2> <p data-svelte-h="svelte-1ybbpoz">The certification process is <strong>completely free</strong>:</p> <ul data-svelte-h="svelte-eoc7ia"><li><em>To get a certificate of completion</em>: you need to complete 80% of the assignments.</li> <li><em>To get a certificate of honors</em>: you need to complete 100% of the assignments.</li></ul> <p data-svelte-h="svelte-13oa6ep">Again, there’s <strong>no deadline</strong> since the course is self-paced. 
But our advice <strong>is to follow the recommended pace section</strong>.</p> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/certification.jpg" alt="Course certification" width="100%"> <h2 class="relative group"><a id="advice" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#advice"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>How to get most of the course?</span></h2> <p data-svelte-h="svelte-180fzyv">To get the most out of the course, we have some advice:</p> <ol data-svelte-h="svelte-128p29f"><li><a href="https://discord.gg/ydHrjt3WP5">Join study groups in Discord</a>: studying in groups is always easier. To do that, you need to join our Discord server. If you&#39;re new to Discord, no worries! 
We have some tools that will help you learn about it.</li> <li><strong>Do the quizzes and assignments</strong>: the best way to learn is to do and test yourself.</li> <li><strong>Define a schedule to stay in sync</strong>: you can use our recommended pace schedule below or create yours.</li></ol> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/advice.jpg" alt="Course advice" width="100%"> <h2 class="relative group"><a id="tools" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#tools"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What tools do I need?</span></h2> <p data-svelte-h="svelte-loeab5">You need only 3 things:</p> <ul data-svelte-h="svelte-7fy04p"><li><em>A computer</em> with an internet connection.</li> <li><em>Google Colab (free version)</em>: most of our hands-on will use Google Colab, the <strong>free version is enough.</strong></li> <li>A <em>Hugging Face Account</em>: to push and load models. 
If you don’t have an account yet, you can create one <strong><a href="https://hf.co/join" rel="nofollow">here</a></strong> (it’s free).</li></ul> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/tools.jpg" alt="Course tools needed" width="100%"> <h2 class="relative group"><a id="recommended-pace" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#recommended-pace"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What is the recommended pace?</span></h2> <p data-svelte-h="svelte-4wknxl">Each chapter in this course is designed <strong>to be completed in 1 week, with approximately 3-4 hours of work per week</strong>. However, you can take as much time as necessary to complete the course. 
If you want to dive into a topic more in-depth, we’ll provide additional resources to help you achieve that.</p> <h2 class="relative group"><a id="who-are-we" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#who-are-we"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>Who are we</span></h2> <p data-svelte-h="svelte-1jup2cx">About the author:</p> <ul data-svelte-h="svelte-11w7f8o"><li><a href="https://twitter.com/ThomasSimonini">Thomas Simonini</a> is a Developer Advocate at Hugging Face 🤗 specializing in Deep Reinforcement Learning. He founded the Deep Reinforcement Learning Course in 2018, which became one of the most used courses in Deep RL.</li></ul> <p data-svelte-h="svelte-gd9a5j">About the team:</p> <ul data-svelte-h="svelte-t69p07"><li><a href="https://twitter.com/osanseviero">Omar Sanseviero</a> is a Machine Learning Engineer at Hugging Face where he works in the intersection of ML, Community and Open Source. Previously, Omar worked as a Software Engineer at Google in the teams of Assistant and TensorFlow Graphics. 
He is from Peru and likes llamas 🦙.</li> <li><a href="https://twitter.com/RisingSayak">Sayak Paul</a> is a Developer Advocate Engineer at Hugging Face. He&#39;s interested in the area of representation learning (self-supervision, semi-supervision, model robustness). And he loves watching crime and action thrillers 🔪.</li></ul> <h2 class="relative group"><a id="challenges" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#challenges"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What are the challenges in this course?</span></h2> <p data-svelte-h="svelte-11dnki3">In this new version of the course, you have two types of challenges:</p> <ul data-svelte-h="svelte-m7zuak"><li><a href="https://huggingface.co/spaces/huggingface-projects/Deep-Reinforcement-Learning-Leaderboard" rel="nofollow">A leaderboard</a> to compare your agent’s performance to other classmates’.</li> <li><a href="https://huggingface.co/learn/deep-rl-course/unit7/introduction?fw=pt" rel="nofollow">AI vs. 
AI challenges</a> where you can train your agent and compete against other classmates’ agents.</li></ul> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/challenges.jpg" alt="Challenges" width="100%"> <h2 class="relative group"><a id="contribute" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#contribute"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>I found a bug, or I want to improve the course</span></h2> <p data-svelte-h="svelte-uwe8dy">Contributions are welcome 🤗</p> <ul data-svelte-h="svelte-l3k1ly"><li>If you <em>found a bug 🐛 in a notebook</em>, please <a href="https://github.com/huggingface/deep-rl-class/issues">open an issue</a> and <strong>describe the problem</strong>.</li> <li>If you <em>want to improve the course</em>, you can <a href="https://github.com/huggingface/deep-rl-class/pulls">open a Pull Request</a>.</li></ul> <h2 class="relative group"><a id="questions" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" 
href="#questions"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>I still have questions</span></h2> <p data-svelte-h="svelte-gxcyvw">Please ask your question in our <a href="https://discord.gg/ydHrjt3WP5">Discord server #rl-discussions</a>.</p> <a class="!text-gray-400 !no-underline text-sm flex items-center not-prose mt-4" href="https://github.com/huggingface/deep-rl-class/blob/main/units/en/unit0/introduction.mdx" target="_blank"><span data-svelte-h="svelte-1kd6by1">&lt;</span> <span data-svelte-h="svelte-x0xyl0">&gt;</span> <span data-svelte-h="svelte-1dajgef"><span class="underline ml-1.5">Update</span> on GitHub</span></a> <p></p>
<script>
{
  // Client bootstrap for this prerendered page. The bare braces keep the
  // `const` bindings below out of the global scope; only the config object
  // is deliberately published as an (implicit) global.
  __sveltekit_18oo4fq = {
    assets: "/docs/deep-rl-course/pr_587/en",
    base: "/docs/deep-rl-course/pr_587/en",
    env: {}
  };

  // Captured synchronously, before any promise callback runs:
  // document.currentScript only refers to this <script> while it executes.
  const mountTarget = document.currentScript.parentElement;

  // One slot per entry in `node_ids` below; both are null for this page.
  const serverData = [null, null];

  // Kick off both entry-module downloads in the same order as before.
  const startModule = import("/docs/deep-rl-course/pr_587/en/_app/immutable/entry/start.7c4c7929.js");
  const appModule = import("/docs/deep-rl-course/pr_587/en/_app/immutable/entry/app.d2a43a08.js");

  Promise.all([startModule, appModule]).then(function (loaded) {
    const kit = loaded[0];
    const app = loaded[1];

    // Hand the app module and the server-rendered container to the runtime.
    kit.start(app, mountTarget, {
      node_ids: [0, 6],
      data: serverData,
      form: null,
      error: null
    });
  });
}
</script>

Xet Storage Details

Size:
30.6 kB
·
Xet hash:
f2fd79fe74d332f910f8d6886e736e766b796aaaf422d196a2f52f24ecb525b0

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.