Update README.md
Browse files
README.md
CHANGED
|
@@ -317,12 +317,13 @@ cd skywork-r1v/inference
|
|
| 317 |
### 2. Set Up the Environment
|
| 318 |
|
| 319 |
```shell
|
| 320 |
-
conda create -n
|
| 321 |
-
conda activate
|
| 322 |
-
|
| 323 |
```
|
| 324 |
|
| 325 |
### 3. Run the Inference Script
|
|
|
|
| 326 |
|
| 327 |
```shell
|
| 328 |
CUDA_VISIBLE_DEVICES="0,1" python inference_with_transformers.py \
|
|
@@ -330,12 +331,30 @@ CUDA_VISIBLE_DEVICES="0,1" python inference_with_transformers.py \
|
|
| 330 |
--image_paths image1_path \
|
| 331 |
--question "your question"
|
| 332 |
```
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 333 |
|
| 334 |
---
|
| 335 |
|
| 336 |
## 4. Citation
|
| 337 |
If you use Skywork-R1V in your research, please cite:
|
| 338 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 339 |
```
|
| 340 |
@misc{peng2025skyworkr1vpioneeringmultimodal,
|
| 341 |
title={Skywork R1V: Pioneering Multimodal Reasoning with Chain-of-Thought},
|
|
|
|
| 317 |
### 2. Set Up the Environment
|
| 318 |
|
| 319 |
```shell
|
| 320 |
+
conda create -n r1v-vllm python=3.12
|
| 321 |
+
conda activate r1v-vllm
|
| 322 |
+
pip install -U vllm
|
| 323 |
```
|
| 324 |
|
| 325 |
### 3. Run the Inference Script
|
| 326 |
+
#### Transformers inference
|
| 327 |
|
| 328 |
```shell
|
| 329 |
CUDA_VISIBLE_DEVICES="0,1" python inference_with_transformers.py \
|
|
|
|
| 331 |
--image_paths image1_path \
|
| 332 |
--question "your question"
|
| 333 |
```
|
| 334 |
+
#### vLLM inference
|
| 335 |
+
```shell
|
| 336 |
+
python inference_with_vllm.py \
|
| 337 |
+
--model_path path \
|
| 338 |
+
--image_paths image1_path image2_path \
|
| 339 |
+
--question "your question" \
|
| 340 |
+
--tensor_parallel_size 4
|
| 341 |
+
```
|
| 342 |
|
| 343 |
---
|
| 344 |
|
| 345 |
## 4. Citation
|
| 346 |
If you use Skywork-R1V in your research, please cite:
|
| 347 |
|
| 348 |
+
```
|
| 349 |
+
@misc{chris2025skyworkr1v2,
|
| 350 |
+
title = {Skywork R1V2: Visual Hybrid Reinforcement Learning for Multimodal Reasoning},
|
| 351 |
+
author = {Chris and Yichen Wei and Peng Yi and Xiaokun Wang and Weijie Qiu and Wei Shen and Tianyidan Xie and Jiangbo Pei and Jianhao Zhang and Yunzhuo Hao and Xuchen Song and Yang Liu and Yahui Zhou},
|
| 352 |
+
year = {2025},
|
| 353 |
+
institution = {Skywork AI, Kunlun Inc.},
|
| 354 |
+
howpublished = {\url{https://github.com/SkyworkAI/Skywork-R1V/blob/main/Skywork_R1V2.pdf}},
|
| 355 |
+
}
|
| 356 |
+
```
|
| 357 |
+
|
| 358 |
```
|
| 359 |
@misc{peng2025skyworkr1vpioneeringmultimodal,
|
| 360 |
title={Skywork R1V: Pioneering Multimodal Reasoning with Chain-of-Thought},
|