---
# Model metadata: license, upstream base models, tags, and library name.
# NOTE(review): the key names look like Hugging Face model-card front matter;
# confirm against the consuming tool before relying on that.
license: apache-2.0
base_model:
  - Qwen/Qwen2.5-VL-3B-Instruct
  - Qwen/Qwen2.5-VL-7B-Instruct
  - lmms-lab/llava-onevision-qwen2-7b-ov
tags:
  - robotics
  - vision-language-action-model
  - vision-language-model
library_name: transformers

---
# Checkpoint collection descriptor for the repository named in `repo`.
# NOTE(review): kept as a separate YAML document because the original layout
# separated it from the metadata above; merge the two mappings (the keys do
# not collide) if the consumer loads a single document.
repo: InternRobotics/RoboInter-VLM
type: "checkpoint-collection"
description: "Collection of RoboInterVLM checkpoints and configs fine-tuned on RoboInter-VQA."
checkpoints:
  # One entry per checkpoint: `name` is the identifier, `path` is its location
  # (presumably a directory relative to the repo root; verify), and `notes` is
  # a short human-readable description.
  - name: RoboInterVLM_qwenvl25_3b
    path: RoboInterVLM_qwenvl25_3b/
    notes: "Lightweight Qwen2.5-VL model"
  - name: RoboInterVLM_qwenvl25_7b
    path: RoboInterVLM_qwenvl25_7b/
    notes: "Stronger performance Qwen2.5-VL backbone"
  - name: RoboInterVLM_llava_one_vision_7B
    path: RoboInterVLM_llava_one_vision_7B/
    notes: "LLaVA-OneVision (SigLIP + Qwen2) backbone"