Robotics
Safetensors
vision-language-action-model
Jia-Zeng committed on
Commit
4d56d86
·
verified ·
1 Parent(s): 7db4dd8

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +14 -14
README.md CHANGED
@@ -11,7 +11,7 @@ datasets:
11
 
12
  # InternVLA-A1: Unifying Understanding, Generation and Action for Robotic Manipulation
13
 
14
- <div style="display: flex; justify-content: center; align-items: center; margin: 20px 0;">
15
  <img src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/teaser_internvla-a1.jpg" alt="Teaser Image" style="max-width: 100%; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);">
16
  </div>
17
 
@@ -32,7 +32,7 @@ Building upon InternVL3 and Qwen3-VL, we instantiate InternVLA-A1 at 2B and 3B p
32
 
33
  ## 🔑 Key Features
34
 
35
- <div style="display: flex; justify-content: center; align-items: center; margin: 20px 0;">
36
  <img src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/method_InternVLA-A1.png" alt="InternVLA-A1 Method Overview" style="max-width: 100%; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);">
37
  </div>
38
 
@@ -53,25 +53,25 @@ Please refer to our official repo [InternVLA-A1](https://github.com/InternRoboti
53
  <div style="display: flex; flex-direction: column; align-items: center; gap: 5px;">
54
  <!-- First Row -->
55
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
56
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
57
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_complete.mp4" type="video/mp4">
58
  </video>
59
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
60
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/In-motion_Ingredient_Picking_4x.mp4" type="video/mp4">
61
  </video>
62
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
63
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_upright_3.mp4" type="video/mp4">
64
  </video>
65
  </div>
66
  <!-- Second Row -->
67
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
68
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
69
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_inverted_2.mp4" type="video/mp4">
70
  </video>
71
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
72
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_upright_2.mp4" type="video/mp4">
73
  </video>
74
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
75
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_upright_1.mp4" type="video/mp4">
76
  </video>
77
  </div>
@@ -83,25 +83,25 @@ Please refer to our official repo [InternVLA-A1](https://github.com/InternRoboti
83
  <div style="display: flex; flex-direction: column; align-items: center; gap: 5px;">
84
  <!-- First Row -->
85
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
86
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
87
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/zig_bag_4x.mp4" type="video/mp4">
88
  </video>
89
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
90
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/sort_parts_4x.mp4" type="video/mp4">
91
  </video>
92
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
93
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/unscrew_cap_4x.mp4" type="video/mp4">
94
  </video>
95
  </div>
96
  <!-- Second Row -->
97
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
98
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
99
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/wipe_stain_4x.mp4" type="video/mp4">
100
  </video>
101
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
102
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/place_flower_4x.mp4" type="video/mp4">
103
  </video>
104
- <video controls autoplay loop muted width="250" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
105
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/sweep_trash_4x.mp4" type="video/mp4">
106
  </video>
107
  </div>
 
11
 
12
  # InternVLA-A1: Unifying Understanding, Generation and Action for Robotic Manipulation
13
 
14
+ <div style="display: flex; justify-content: center; align-items: center; margin: 10px 0;">
15
  <img src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/teaser_internvla-a1.jpg" alt="Teaser Image" style="max-width: 100%; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);">
16
  </div>
17
 
 
32
 
33
  ## 🔑 Key Features
34
 
35
+ <div style="display: flex; justify-content: center; align-items: center; margin: 10px 0;">
36
  <img src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/method_InternVLA-A1.png" alt="InternVLA-A1 Method Overview" style="max-width: 100%; border-radius: 10px; box-shadow: 0 4px 8px rgba(0, 0, 0, 0.1);">
37
  </div>
38
 
 
53
  <div style="display: flex; flex-direction: column; align-items: center; gap: 5px;">
54
  <!-- First Row -->
55
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
56
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
57
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_complete.mp4" type="video/mp4">
58
  </video>
59
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
60
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/In-motion_Ingredient_Picking_4x.mp4" type="video/mp4">
61
  </video>
62
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
63
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_upright_3.mp4" type="video/mp4">
64
  </video>
65
  </div>
66
  <!-- Second Row -->
67
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
68
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
69
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_inverted_2.mp4" type="video/mp4">
70
  </video>
71
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
72
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_upright_2.mp4" type="video/mp4">
73
  </video>
74
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
75
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/express_sorting_upright_1.mp4" type="video/mp4">
76
  </video>
77
  </div>
 
83
  <div style="display: flex; flex-direction: column; align-items: center; gap: 5px;">
84
  <!-- First Row -->
85
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
86
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
87
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/zig_bag_4x.mp4" type="video/mp4">
88
  </video>
89
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
90
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/sort_parts_4x.mp4" type="video/mp4">
91
  </video>
92
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
93
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/unscrew_cap_4x.mp4" type="video/mp4">
94
  </video>
95
  </div>
96
  <!-- Second Row -->
97
  <div style="display: flex; justify-content: center; align-items: center; gap: 5px;">
98
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
99
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/wipe_stain_4x.mp4" type="video/mp4">
100
  </video>
101
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
102
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/place_flower_4x.mp4" type="video/mp4">
103
  </video>
104
+ <video controls autoplay loop muted width="210" style="border-radius: 5px; box-shadow: 0 2px 4px rgba(0, 0, 0, 0.1);">
105
  <source src="https://huggingface.co/spaces/Jia-Zeng/InternVLA_A1_Media/resolve/main/sweep_trash_4x.mp4" type="video/mp4">
106
  </video>
107
  </div>