umjunsik1323 committed on
Commit
e5c4c96
·
verified ·
1 Parent(s): 4e0fb6c

Update RL Model: Add/Update model 'PPO-CartPole-v1-ep104' and regenerate unified README.md

Browse files
PPO-CartPole-v1-ep104/group1-shard1of1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1137de53a2b312772430094f881336f9e7d83e00dc0dc61a318381b06251b201
3
+ size 69640
PPO-CartPole-v1-ep104/model.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"modelTopology":{"class_name":"Sequential","config":{"name":"sequential_1","layers":[{"class_name":"Dense","config":{"units":128,"activation":"tanh","use_bias":true,"kernel_initializer":{"class_name":"VarianceScaling","config":{"scale":1,"mode":"fan_avg","distribution":"normal","seed":null}},"bias_initializer":{"class_name":"Zeros","config":{}},"kernel_regularizer":null,"bias_regularizer":null,"activity_regularizer":null,"kernel_constraint":null,"bias_constraint":null,"name":"dense_Dense1","trainable":true,"batch_input_shape":[null,4],"dtype":"float32"}},{"class_name":"Dense","config":{"units":128,"activation":"tanh","use_bias":true,"kernel_initializer":{"class_name":"VarianceScaling","config":{"scale":1,"mode":"fan_avg","distribution":"normal","seed":null}},"bias_initializer":{"class_name":"Zeros","config":{}},"kernel_regularizer":null,"bias_regularizer":null,"activity_regularizer":null,"kernel_constraint":null,"bias_constraint":null,"name":"dense_Dense2","trainable":true}},{"class_name":"Dense","config":{"units":2,"activation":"softmax","use_bias":true,"kernel_initializer":{"class_name":"VarianceScaling","config":{"scale":1,"mode":"fan_avg","distribution":"normal","seed":null}},"bias_initializer":{"class_name":"Zeros","config":{}},"kernel_regularizer":null,"bias_regularizer":null,"activity_regularizer":null,"kernel_constraint":null,"bias_constraint":null,"name":"dense_Dense3","trainable":true}}]},"keras_version":"tfjs-layers 4.22.0","backend":"tensor_flow.js"},"weightsManifest":[{"paths":["group1-shard1of1.bin"],"weights":[{"name":"dense_Dense1/kernel","shape":[4,128],"dtype":"float32"},{"name":"dense_Dense1/bias","shape":[128],"dtype":"float32"},{"name":"dense_Dense2/kernel","shape":[128,128],"dtype":"float32"},{"name":"dense_Dense2/bias","shape":[128],"dtype":"float32"},{"name":"dense_Dense3/kernel","shape":[128,2],"dtype":"float32"},{"name":"dense_Dense3/bias","shape":[2],"dtype":"float32"}]}],"agenlusMetadata":{"algorithm":"PPO","episodes":104,"hyperparams":{"gamma":0.99,"lambdaGae":0.95,"clipEpsilon":0.2,"entropyCoef":0.01,"learningRate":0.0003,"epochs":4,"rolloutLen":512,"currentEpsilon":null,"currentAlpha":null},"seed":704946,"seedPinned":true}}
README.md CHANGED
@@ -1,3 +1,36 @@
1
  ---
2
- license: mit
 
 
 
 
3
  ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ library_name: tfjs
3
+ tags:
4
+ - reinforcement-learning
5
+ - deep-reinforcement-learning
6
+ - agenlus
7
  ---
8
+
9
+ # Agenlus Model Hub 🚀
10
+
11
+ Welcome to the Agenlus reinforcement learning model repository. It hosts trained agents exported in TensorFlow.js Layers format; each model lives in its own subdirectory.
12
+
13
+ ## 📊 Models Summary
14
+
15
+ | Model Name | Environment | Algorithm | Best Avg Reward | Episodes | Links |
16
+ | :--- | :--- | :--- | :--- | :--- | :--- |
17
+ | **PPO-CartPole-v1-ep104** | `CartPole-v1` | `PPO` | **45.39** | 104 | [Browse Files](https://huggingface.co/umjunsik1323/RL_Models/tree/main/PPO-CartPole-v1-ep104) |
18
+
19
+ ## 📝 Model Details & Instructions
20
+
21
+ ### 📦 PPO-CartPole-v1-ep104
22
+ * **Environment:** `CartPole-v1`
23
+ * **RL Algorithm:** `PPO`
24
+ * **Best Avg Reward:** `45.39`
25
+ * **Episodes Trained:** `104`
26
+
27
+ **Description:**
28
+ PPO model trained on CartPole-v1 for 104 episodes. Best avg reward: 45.39.
29
+
30
+ **How to load:**
31
+ ```javascript
32
+ const model = await tf.loadLayersModel('https://huggingface.co/umjunsik1323/RL_Models/resolve/main/PPO-CartPole-v1-ep104/model.json');
33
+ ```
34
+
35
+ ---
36
+