Update README.md
Browse files
README.md
CHANGED
|
@@ -64,10 +64,15 @@ generated_ids = [
|
|
| 64 |
response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
|
| 65 |
```
|
| 66 |
|
| 67 |
-
|
| 68 |
|
| 69 |
If you find our work helpful, feel free to give us a citation.
|
| 70 |
|
| 71 |
```
|
| 72 |
-
|
| 73 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
|
| 65 |
```
|
| 66 |
|
| 67 |
+
## Citation
|
| 68 |
|
| 69 |
If you find our work helpful, feel free to give us a citation.
|
| 70 |
|
| 71 |
```
|
| 72 |
+
@article{zhang2025rlfr,
|
| 73 |
+
title={RLFR: Extending Reinforcement Learning for LLMs with Flow Environment},
|
| 74 |
+
author={Zhang, Jinghao and Zheng, Naishan and Li, Ruilin and Cheng, Dongzhou and Liang, Zheming and Zhao, Feng and Wang, Jiaqi},
|
| 75 |
+
journal={arXiv preprint arXiv:2510.10201},
|
| 76 |
+
year={2025}
|
| 77 |
+
}
|
| 78 |
+
```
|