Update README.md
Browse files
README.md
CHANGED
|
@@ -22,9 +22,18 @@ pipeline_tag: text-generation
|
|
| 22 |
</div>
|
| 23 |
|
| 24 |
<!-- Subtitle -->
|
| 25 |
-
<p style="font-size:
|
| 26 |
Democratizing Reinforcement Learning for LLM Agents
|
| 27 |
</p>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 28 |
</div>
|
| 29 |
|
| 30 |
<div align="center" style="line-height: 1;">
|
|
|
|
| 22 |
</div>
|
| 23 |
|
| 24 |
<!-- Subtitle -->
|
| 25 |
+
<p style="font-size: 0.8em; color: #a1a1aa; margin: 0 0 1em 0; font-family: -apple-system, BlinkMacSystemFont, 'SF Pro Text', sans-serif; line-height: 1.5; font-weight: 400;">
|
| 26 |
Democratizing Reinforcement Learning for LLM Agents
|
| 27 |
</p>
|
| 28 |
+
|
| 29 |
+
<!-- Trained with rLLM Badge -->
|
| 30 |
+
<div style="display: inline-flex; align-items: center; gap: 0.5em; background: rgba(255, 255, 255, 0.1); border: 1px solid rgba(255, 255, 255, 0.2); border-radius: 0.75em; padding: 0.5em 1em; backdrop-filter: blur(0.5em); transition: all 0.3s ease;">
|
| 31 |
+
<svg width="16" height="16" viewBox="0 0 24 24" fill="currentColor" style="color: #ffffff;">
|
| 32 |
+
<path d="M12 0c-6.626 0-12 5.373-12 12 0 5.302 3.438 9.8 8.207 11.387.599.111.793-.261.793-.577v-2.234c-3.338.726-4.033-1.416-4.033-1.416-.546-1.387-1.333-1.756-1.333-1.756-1.089-.745.083-.729.083-.729 1.205.084 1.839 1.237 1.839 1.237 1.07 1.834 2.807 1.304 3.492.997.107-.775.418-1.305.762-1.604-2.665-.305-5.467-1.334-5.467-5.931 0-1.311.469-2.381 1.236-3.221-.124-.303-.535-1.524.117-3.176 0 0 1.008-.322 3.301 1.23.957-.266 1.983-.399 3.003-.404 1.02.005 2.047.138 3.006.404 2.291-1.552 3.297-1.23 3.297-1.23.653 1.653.242 2.874.118 3.176.77.84 1.235 1.911 1.235 3.221 0 4.609-2.807 5.624-5.479 5.921.43.372.823 1.102.823 2.222v3.293c0 .319.192.694.801.576 4.765-1.589 8.199-6.086 8.199-11.386 0-6.627-5.373-12-12-12z"/>
|
| 33 |
+
</svg>
|
| 34 |
+
<span style="font-size: 0.75em; color: #ffffff; font-family: -apple-system, BlinkMacSystemFont, 'SF Pro Text', sans-serif; font-weight: 500; letter-spacing: 0.02em;">Trained with rLLM</span>
|
| 35 |
+
</div>
|
| 36 |
+
|
| 37 |
</div>
|
| 38 |
|
| 39 |
<div align="center" style="line-height: 1;">
|