Buckets:

hf-doc-build
/

doc-dev

Files

xet

hf-doc-build/doc-dev / deep-rl-course /pr_587 /en /unit0 /introduction.html

rtrm

about 2 months ago

download

raw

30.6 kB

	<meta charset="utf-8">
	<!-- Page outline (title, anchor ids, heading depths) serialized as JSON. The JSON's double quotes are written as &quot; so they do not terminate the double-quoted content attribute. -->
	<meta name="hf:doc:metadata" content="{&quot;title&quot;:&quot;Welcome to the 🤗 Deep Reinforcement Learning Course&quot;,&quot;local&quot;:&quot;introduction&quot;,&quot;sections&quot;:[{&quot;title&quot;:&quot;What to expect?&quot;,&quot;local&quot;:&quot;expect&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What does the course look like?&quot;,&quot;local&quot;:&quot;course-look-like&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What’s the syllabus?&quot;,&quot;local&quot;:&quot;syllabus&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;Two paths: choose your own adventure&quot;,&quot;local&quot;:&quot;two-paths&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;The Certification Process&quot;,&quot;local&quot;:&quot;certification-process&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;How to get most of the course?&quot;,&quot;local&quot;:&quot;advice&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What tools do I need?&quot;,&quot;local&quot;:&quot;tools&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What is the recommended pace?&quot;,&quot;local&quot;:&quot;recommended-pace&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;Who are we&quot;,&quot;local&quot;:&quot;who-are-we&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;What are the challenges in this course?&quot;,&quot;local&quot;:&quot;challenges&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;I found a bug, or I want to improve the course&quot;,&quot;local&quot;:&quot;contribute&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2},{&quot;title&quot;:&quot;I still have questions&quot;,&quot;local&quot;:&quot;questions&quot;,&quot;sections&quot;:[],&quot;depth&quot;:2}],&quot;depth&quot;:1}">
	<!-- Stylesheet asset: a .css file has to be linked with rel="stylesheet"; rel="modulepreload" is only defined for JavaScript modules. -->
	<link rel="stylesheet" href="/docs/deep-rl-course/pr_587/en/_app/immutable/assets/0.e3b0c442.css">
	<!-- Preload the JavaScript entry points, shared chunks and route nodes under _app/immutable. -->
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/entry/start.7c4c7929.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/scheduler.37c15a92.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/singletons.945d9b5d.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/index.18351ede.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/paths.9ffa1e06.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/entry/app.d2a43a08.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/index.7cb9c9b8.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/nodes/0.e67798fa.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/each.e59479a4.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/nodes/6.b0856558.js">
	<link rel="modulepreload" href="/docs/deep-rl-course/pr_587/en/_app/immutable/chunks/EditOnGithub.858acfec.js"><!-- HEAD_svelte-u9bgzb_START --><meta name="hf:doc:metadata" content="{"title":"Welcome to the 🤗 Deep Reinforcement Learning Course","local":"introduction","sections":[{"title":"What to expect?","local":"expect","sections":[],"depth":2},{"title":"What does the course look like?","local":"course-look-like","sections":[],"depth":2},{"title":"What’s the syllabus?","local":"syllabus","sections":[],"depth":2},{"title":"Two paths: choose your own adventure","local":"two-paths","sections":[],"depth":2},{"title":"The Certification Process","local":"certification-process","sections":[],"depth":2},{"title":"How to get most of the course?","local":"advice","sections":[],"depth":2},{"title":"What tools do I need?","local":"tools","sections":[],"depth":2},{"title":"What is the recommended pace?","local":"recommended-pace","sections":[],"depth":2},{"title":"Who are we","local":"who-are-we","sections":[],"depth":2},{"title":"What are the challenges in this course?","local":"challenges","sections":[],"depth":2},{"title":"I found a bug, or I want to improve the course","local":"contribute","sections":[],"depth":2},{"title":"I still have questions","local":"questions","sections":[],"depth":2}],"depth":1}"><!-- HEAD_svelte-u9bgzb_END --> <p></p> <h1 class="relative group"><a id="introduction" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#introduction"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 
1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>Welcome to the 🤗 Deep Reinforcement Learning Course</span></h1> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/thumbnail.jpg" alt="Deep RL Course thumbnail" width="100%"> <p data-svelte-h="svelte-lar89z">Welcome to the most fascinating topic in Artificial Intelligence: <strong>Deep Reinforcement Learning</strong>.</p> <p data-svelte-h="svelte-9h5dhu">This course will <strong>teach you about Deep Reinforcement Learning from beginner to expert</strong>. It’s completely free and open-source!</p> <p data-svelte-h="svelte-q5r4ab">In this introduction unit you’ll:</p> <ul data-svelte-h="svelte-iulplw"><li>Learn more about the <strong>course content</strong>.</li> <li><strong>Define the path</strong> you’re going to take (either self-audit or certification process).</li> <li>Learn more about the <strong>AI vs. 
AI challenges</strong> you’re going to participate in.</li> <li>Learn more <strong>about us</strong>.</li> <li><strong>Create your Hugging Face account</strong> (it’s free).</li> <li><strong>Sign-up to our Discord server</strong>, the place where you can chat with your classmates and us (the Hugging Face team).</li></ul> <p data-svelte-h="svelte-4b3xjd">Let’s get started!</p> <h2 class="relative group"><a id="expect" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#expect"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What to expect?</span></h2> <p data-svelte-h="svelte-f2qxb3">In this course, you will:</p> <ul data-svelte-h="svelte-kd6znf"><li>📖 Study Deep Reinforcement Learning in <strong>theory and practice.</strong></li> <li>🧑‍💻 Learn to <strong>use famous Deep RL libraries</strong> such as <a href="https://stable-baselines3.readthedocs.io/en/master/" rel="nofollow">Stable Baselines3</a>, <a href="https://github.com/DLR-RM/rl-baselines3-zoo" rel="nofollow">RL Baselines3 Zoo</a>, <a href="https://samplefactory.dev/" rel="nofollow">Sample Factory</a> and <a href="https://github.com/vwxyzjn/cleanrl" 
rel="nofollow">CleanRL</a>.</li> <li>🤖 <strong>Train agents in unique environments</strong> such as <a href="https://huggingface.co/spaces/ThomasSimonini/SnowballFight" rel="nofollow">SnowballFight</a>, <a href="https://huggingface.co/spaces/ThomasSimonini/Huggy" rel="nofollow">Huggy the Doggo 🐶</a>, <a href="https://vizdoom.cs.put.edu.pl/" rel="nofollow">VizDoom (Doom)</a> and classical ones such as <a href="https://gymnasium.farama.org/environments/atari/space_invaders/" rel="nofollow">Space Invaders</a>, <a href="https://pybullet.org/wordpress/" rel="nofollow">PyBullet</a> and more.</li> <li>💾 Share your <strong>trained agents with one line of code to the Hub</strong> and also download powerful agents from the community.</li> <li>🏆 Participate in challenges where you will <strong>evaluate your agents against other teams. You’ll also get to play against the agents you’ll train.</strong></li> <li>🎓 <strong>Earn a certificate of completion</strong> by completing 80% of the assignments.</li></ul> <p data-svelte-h="svelte-t67g99">And more!</p> <p data-svelte-h="svelte-1xij83d">At the end of this course, <strong>you’ll get a solid foundation from the basics to the SOTA (state-of-the-art) of methods</strong>.</p> <p data-svelte-h="svelte-i91mrq">Don’t forget to <strong><a href="http://eepurl.com/ic5ZUD">sign up to the course</a></strong> (we are collecting your email to be able to <strong>send you the links when each Unit is published and give you information about the challenges and updates).</strong></p> <p data-svelte-h="svelte-a79ye4">Sign up 👉 <a href="http://eepurl.com/ic5ZUD">here</a></p> <h2 class="relative group"><a id="course-look-like" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#course-look-like"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" 
width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What does the course look like?</span></h2> <p data-svelte-h="svelte-1ee6w8b">The course is composed of:</p> <ul data-svelte-h="svelte-1ju8ahi"><li><p><em>A theory part</em>: where you learn a <strong>concept in theory</strong>.</p></li> <li><p><em>A hands-on</em>: where you’ll learn <strong>to use famous Deep RL libraries</strong> to train your agents in unique environments. These hands-on will be <strong>Google Colab notebooks with companion tutorial videos</strong> if you prefer learning with video format!</p></li> <li><p><em>Challenges</em>: you’ll get to put your agent to compete against other agents in different challenges. 
There will also be <a href="https://huggingface.co/spaces/huggingface-projects/Deep-Reinforcement-Learning-Leaderboard" rel="nofollow">a leaderboard</a> for you to compare the agents’ performance.</p></li></ul> <h2 class="relative group"><a id="syllabus" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#syllabus"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What’s the syllabus?</span></h2> <p data-svelte-h="svelte-oyiyj9">This is the course’s syllabus:</p> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/syllabus1.jpg" alt="Syllabus Part 1" width="100%"> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/syllabus2.jpg" alt="Syllabus Part 2" width="100%"> <h2 class="relative group"><a id="two-paths" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#two-paths"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" 
width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>Two paths: choose your own adventure</span></h2> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/two-paths.jpg" alt="Two paths" width="100%"> <p data-svelte-h="svelte-1ygf71c">You can choose to follow this course either:</p> <ul data-svelte-h="svelte-186gjk5"><li><em>To get a certificate of completion</em>: you need to complete 80% of the assignments.</li> <li><em>To get a certificate of honors</em>: you need to complete 100% of the assignments.</li> <li><em>As a simple audit</em>: you can participate in all challenges and do assignments if you want.</li></ul> <p data-svelte-h="svelte-1tfwr9k">There’s <strong>no deadlines, the course is self-paced</strong>.
	Both paths <strong>are completely free</strong>.
	Whatever path you choose, we advise you <strong>to follow the recommended pace to enjoy the course and challenges with your fellow classmates.</strong></p> <p data-svelte-h="svelte-qy3r5p">You don’t need to tell us which path you choose. <strong>If you get more than 80% of the assignments done, you’ll get a certificate.</strong></p> <h2 class="relative group"><a id="certification-process" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#certification-process"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>The Certification Process</span></h2> <p data-svelte-h="svelte-1ybbpoz">The certification process is <strong>completely free</strong>:</p> <ul data-svelte-h="svelte-eoc7ia"><li><em>To get a certificate of completion</em>: you need to complete 80% of the assignments.</li> <li><em>To get a certificate of honors</em>: you need to complete 100% of the assignments.</li></ul> <p data-svelte-h="svelte-13oa6ep">Again, there’s <strong>no deadline</strong> since the course is self paced. 
But our advice <strong>is to follow the recommended pace section</strong>.</p> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/certification.jpg" alt="Course certification" width="100%"> <h2 class="relative group"><a id="advice" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#advice"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>How to get most of the course?</span></h2> <p data-svelte-h="svelte-180fzyv">To get most of the course, we have some advice:</p> <ol data-svelte-h="svelte-128p29f"><li><a href="https://discord.gg/ydHrjt3WP5">Join study groups in Discord </a>: studying in groups is always easier. To do that, you need to join our discord server. If you're new to Discord, no worries! 
We have some tools that will help you learn about it.</li> <li><strong>Do the quizzes and assignments</strong>: the best way to learn is to do and test yourself.</li> <li><strong>Define a schedule to stay in sync</strong>: you can use our recommended pace schedule below or create yours.</li></ol> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/advice.jpg" alt="Course advice" width="100%"> <h2 class="relative group"><a id="tools" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#tools"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What tools do I need?</span></h2> <p data-svelte-h="svelte-loeab5">You need only 3 things:</p> <ul data-svelte-h="svelte-7fy04p"><li><em>A computer</em> with an internet connection.</li> <li><em>Google Colab (free version)</em>: most of our hands-on will use Google Colab, the <strong>free version is enough.</strong></li> <li>A <em>Hugging Face Account</em>: to push and load models. 
If you don’t have an account yet, you can create one <strong><a href="https://hf.co/join" rel="nofollow">here</a></strong> (it’s free).</li></ul> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/tools.jpg" alt="Course tools needed" width="100%"> <h2 class="relative group"><a id="recommended-pace" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#recommended-pace"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What is the recommended pace?</span></h2> <p data-svelte-h="svelte-4wknxl">Each chapter in this course is designed <strong>to be completed in 1 week, with approximately 3-4 hours of work per week</strong>. However, you can take as much time as necessary to complete the course. 
If you want to dive into a topic more in-depth, we’ll provide additional resources to help you achieve that.</p> <h2 class="relative group"><a id="who-are-we" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#who-are-we"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>Who are we</span></h2> <p data-svelte-h="svelte-1jup2cx">About the author:</p> <ul data-svelte-h="svelte-11w7f8o"><li><a href="https://twitter.com/ThomasSimonini">Thomas Simonini</a> is a Developer Advocate at Hugging Face 🤗 specializing in Deep Reinforcement Learning. He founded the Deep Reinforcement Learning Course in 2018, which became one of the most used courses in Deep RL.</li></ul> <p data-svelte-h="svelte-gd9a5j">About the team:</p> <ul data-svelte-h="svelte-t69p07"><li><a href="https://twitter.com/osanseviero">Omar Sanseviero</a> is a Machine Learning Engineer at Hugging Face where he works in the intersection of ML, Community and Open Source. Previously, Omar worked as a Software Engineer at Google in the teams of Assistant and TensorFlow Graphics. 
He is from Peru and likes llamas 🦙.</li> <li><a href="https://twitter.com/RisingSayak">Sayak Paul</a> is a Developer Advocate Engineer at Hugging Face. He's interested in the area of representation learning (self-supervision, semi-supervision, model robustness). And he loves watching crime and action thrillers 🔪.</li></ul> <h2 class="relative group"><a id="challenges" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#challenges"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>What are the challenges in this course?</span></h2> <p data-svelte-h="svelte-11dnki3">In this new version of the course, you have two types of challenges:</p> <ul data-svelte-h="svelte-m7zuak"><li><a href="https://huggingface.co/spaces/huggingface-projects/Deep-Reinforcement-Learning-Leaderboard" rel="nofollow">A leaderboard</a> to compare your agent’s performance to other classmates’.</li> <li><a href="https://huggingface.co/learn/deep-rl-course/unit7/introduction?fw=pt" rel="nofollow">AI vs. 
AI challenges</a> where you can train your agent and compete against other classmates’ agents.</li></ul> <img src="https://huggingface.co/datasets/huggingface-deep-rl-course/course-images/resolve/main/en/unit0/challenges.jpg" alt="Challenges" width="100%"> <h2 class="relative group"><a id="contribute" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" href="#contribute"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>I found a bug, or I want to improve the course</span></h2> <p data-svelte-h="svelte-uwe8dy">Contributions are welcomed 🤗</p> <ul data-svelte-h="svelte-l3k1ly"><li>If you <em>found a bug 🐛 in a notebook</em>, please <a href="https://github.com/huggingface/deep-rl-class/issues">open an issue</a> and <strong>describe the problem</strong>.</li> <li>If you <em>want to improve the course</em>, you can <a href="https://github.com/huggingface/deep-rl-class/pulls">open a Pull Request.</a></li></ul> <h2 class="relative group"><a id="questions" class="header-link block pr-1.5 text-lg no-hover:hidden with-hover:absolute with-hover:p-1.5 with-hover:opacity-0 with-hover:group-hover:opacity-100 with-hover:right-full" 
href="#questions"><span><svg class="" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" aria-hidden="true" role="img" width="1em" height="1em" preserveAspectRatio="xMidYMid meet" viewBox="0 0 256 256"><path d="M167.594 88.393a8.001 8.001 0 0 1 0 11.314l-67.882 67.882a8 8 0 1 1-11.314-11.315l67.882-67.881a8.003 8.003 0 0 1 11.314 0zm-28.287 84.86l-28.284 28.284a40 40 0 0 1-56.567-56.567l28.284-28.284a8 8 0 0 0-11.315-11.315l-28.284 28.284a56 56 0 0 0 79.196 79.197l28.285-28.285a8 8 0 1 0-11.315-11.314zM212.852 43.14a56.002 56.002 0 0 0-79.196 0l-28.284 28.284a8 8 0 1 0 11.314 11.314l28.284-28.284a40 40 0 0 1 56.568 56.567l-28.285 28.285a8 8 0 0 0 11.315 11.314l28.284-28.284a56.065 56.065 0 0 0 0-79.196z" fill="currentColor"></path></svg></span></a> <span>I still have questions</span></h2> <p data-svelte-h="svelte-gxcyvw">Please ask your question in our <a href="https://discord.gg/ydHrjt3WP5">discord server #rl-discussions.</a></p> <a class="!text-gray-400 !no-underline text-sm flex items-center not-prose mt-4" href="https://github.com/huggingface/deep-rl-class/blob/main/units/en/unit0/introduction.mdx" target="_blank"><span data-svelte-h="svelte-1kd6by1">&lt;</span> <span data-svelte-h="svelte-x0xyl0">&gt;</span> <span data-svelte-h="svelte-1dajgef"><span class="underline ml-1.5">Update</span> on GitHub</span></a> <p></p>

	<script>
	{
		// Publish the asset/base paths and an empty env object on the global
		// `__sveltekit_18oo4fq` (deliberately assigned without a declaration).
		__sveltekit_18oo4fq = {
			assets: "/docs/deep-rl-course/pr_587/en",
			base: "/docs/deep-rl-course/pr_587/en",
			env: {}
		};

		// `document.currentScript` is read synchronously, while this inline
		// script is the one executing; its parent element is the mount target.
		const target = document.currentScript.parentElement;

		// One entry per node id below; both are null here.
		const payload = [null, null];

		// Kick off both dynamic imports before waiting on either of them.
		const pendingModules = [
			import("/docs/deep-rl-course/pr_587/en/_app/immutable/entry/start.7c4c7929.js"),
			import("/docs/deep-rl-course/pr_587/en/_app/immutable/entry/app.d2a43a08.js")
		];

		Promise.all(pendingModules).then((loaded) => {
			const [kit, app] = loaded;
			// NOTE(review): node ids 0 and 6 presumably correspond to the
			// nodes/0 and nodes/6 modules preloaded in the head — confirm.
			const options = {
				node_ids: [0, 6],
				data: payload,
				form: null,
				error: null
			};
			kit.start(app, target, options);
		});
	}
	</script>

Xet Storage Details

Size: 30.6 kB
Xet hash: f2fd79fe74d332f910f8d6886e736e766b796aaaf422d196a2f52f24ecb525b0

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.