# Repository-level metadata: licence, upstream base models, tags and library.
# NOTE(review): these keys look like Hugging Face model-card metadata —
# confirm against whatever tool consumes this file.
license: apache-2.0
base_model:
  - Qwen/Qwen2.5-VL-3B-Instruct
  - Qwen/Qwen2.5-VL-7B-Instruct
  - lmms-lab/llava-onevision-qwen2-7b-ov
tags:
  - robotics
  - vision-language-action-model
  - vision-language-model
library_name: transformers

# Description of the checkpoint collection published under `repo`.
repo: InternRobotics/RoboInter-VLM
type: "checkpoint-collection"
description: "Collection of RoboInterVLM checkpoints and configs fine-tuned on RoboInter-VQA."

# One entry per checkpoint: `name` identifies it, `path` locates it and
# `notes` carries a free-text remark about the backbone.
# NOTE(review): the trailing slash suggests each `path` is a directory
# relative to the repository root — confirm.
checkpoints:
  - name: RoboInterVLM_qwenvl25_3b
    path: RoboInterVLM_qwenvl25_3b/
    notes: "Lightweight Qwen2.5-VL model"
  - name: RoboInterVLM_qwenvl25_7b
    path: RoboInterVLM_qwenvl25_7b/
    notes: "Stronger performance Qwen2.5-VL backbone"
  - name: RoboInterVLM_llava_one_vision_7B
    path: RoboInterVLM_llava_one_vision_7B/
    notes: "LLaVA-OneVision (SigLIP + Qwen2) backbone"