Update README.md
Browse files
README.md
CHANGED
|
@@ -40,9 +40,19 @@ This is a trained **PPO agent** for the **LunarLander-v2** environment using Sta
|
|
| 40 |
- Learning rate: 3e-4
|
| 41 |
- Optimizer: Adam
|
| 42 |
|
| 43 |
-
|
|
|
|
|
|
|
|
|
|
| 44 |

|
| 45 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 46 |
## 🛠 Usage
|
| 47 |
|
| 48 |
```python
|
|
@@ -55,20 +65,17 @@ from huggingface_hub import hf_hub_download
|
|
| 55 |
# -------------------------
|
| 56 |
# Environment Setup
|
| 57 |
# -------------------------
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
# Environment for evaluation (no render)
|
| 62 |
-
eval_env = Monitor(gym.make("LunarLander-v2"))
|
| 63 |
|
| 64 |
# -------------------------
|
| 65 |
-
# Load pretrained model
|
| 66 |
# -------------------------
|
| 67 |
model_path = hf_hub_download("Vishand03/lunarlander-ppo", "model.zip")
|
| 68 |
model = PPO.load(model_path)
|
| 69 |
|
| 70 |
# -------------------------
|
| 71 |
-
# Run
|
| 72 |
# -------------------------
|
| 73 |
obs, _ = env.reset()
|
| 74 |
done = False
|
|
|
|
| 40 |
- Learning rate: 3e-4
|
| 41 |
- Optimizer: Adam
|
| 42 |
|
| 43 |
+
---
|
| 44 |
+
|
| 45 |
+
## 🎥 Demo (Preview)
|
| 46 |
+
|
| 47 |

|
| 48 |
|
| 49 |
+
---
|
| 50 |
+
|
| 51 |
+
## 🎬 Full Demo Video
|
| 52 |
+
👉 [Watch the full video here](replay.mp4)
|
| 53 |
+
|
| 54 |
+
---
|
| 55 |
+
|
| 56 |
## 🛠 Usage
|
| 57 |
|
| 58 |
```python
|
|
|
|
| 65 |
# -------------------------
|
| 66 |
# Environment Setup
|
| 67 |
# -------------------------
|
| 68 |
+
env = gym.make("LunarLander-v2", render_mode="human") # Human render
|
| 69 |
+
eval_env = Monitor(gym.make("LunarLander-v2")) # Evaluation (no render)
|
|
|
|
|
|
|
|
|
|
| 70 |
|
| 71 |
# -------------------------
|
| 72 |
+
# Load pretrained model
|
| 73 |
# -------------------------
|
| 74 |
model_path = hf_hub_download("Vishand03/lunarlander-ppo", "model.zip")
|
| 75 |
model = PPO.load(model_path)
|
| 76 |
|
| 77 |
# -------------------------
|
| 78 |
+
# Run one episode
|
| 79 |
# -------------------------
|
| 80 |
obs, _ = env.reset()
|
| 81 |
done = False
|