wli1995 committed on
Commit
49a09e2
·
verified ·
1 Parent(s): 134374c

update axmodel and demo

Browse files
Files changed (43) hide show
  1. README.md +118 -31
  2. internvl3_2b_axmodel/qwen2_p128_l0_together.axmodel +2 -2
  3. internvl3_2b_axmodel/qwen2_p128_l10_together.axmodel +2 -2
  4. internvl3_2b_axmodel/qwen2_p128_l11_together.axmodel +2 -2
  5. internvl3_2b_axmodel/qwen2_p128_l12_together.axmodel +2 -2
  6. internvl3_2b_axmodel/qwen2_p128_l13_together.axmodel +2 -2
  7. internvl3_2b_axmodel/qwen2_p128_l14_together.axmodel +2 -2
  8. internvl3_2b_axmodel/qwen2_p128_l15_together.axmodel +2 -2
  9. internvl3_2b_axmodel/qwen2_p128_l16_together.axmodel +2 -2
  10. internvl3_2b_axmodel/qwen2_p128_l17_together.axmodel +2 -2
  11. internvl3_2b_axmodel/qwen2_p128_l18_together.axmodel +2 -2
  12. internvl3_2b_axmodel/qwen2_p128_l19_together.axmodel +2 -2
  13. internvl3_2b_axmodel/qwen2_p128_l1_together.axmodel +2 -2
  14. internvl3_2b_axmodel/qwen2_p128_l20_together.axmodel +2 -2
  15. internvl3_2b_axmodel/qwen2_p128_l21_together.axmodel +2 -2
  16. internvl3_2b_axmodel/qwen2_p128_l22_together.axmodel +2 -2
  17. internvl3_2b_axmodel/qwen2_p128_l23_together.axmodel +2 -2
  18. internvl3_2b_axmodel/qwen2_p128_l24_together.axmodel +2 -2
  19. internvl3_2b_axmodel/qwen2_p128_l25_together.axmodel +2 -2
  20. internvl3_2b_axmodel/qwen2_p128_l26_together.axmodel +2 -2
  21. internvl3_2b_axmodel/qwen2_p128_l27_together.axmodel +2 -2
  22. internvl3_2b_axmodel/qwen2_p128_l2_together.axmodel +2 -2
  23. internvl3_2b_axmodel/qwen2_p128_l3_together.axmodel +2 -2
  24. internvl3_2b_axmodel/qwen2_p128_l4_together.axmodel +2 -2
  25. internvl3_2b_axmodel/qwen2_p128_l5_together.axmodel +2 -2
  26. internvl3_2b_axmodel/qwen2_p128_l6_together.axmodel +2 -2
  27. internvl3_2b_axmodel/qwen2_p128_l7_together.axmodel +2 -2
  28. internvl3_2b_axmodel/qwen2_p128_l8_together.axmodel +2 -2
  29. internvl3_2b_axmodel/qwen2_p128_l9_together.axmodel +2 -2
  30. internvl3_2b_axmodel/qwen2_post.axmodel +1 -1
  31. main_api_ax650 +2 -2
  32. main_api_axcl_aarch64 +2 -2
  33. main_api_axcl_x86 +2 -2
  34. main_ax650 +2 -2
  35. main_axcl_aarch64 +1 -1
  36. main_axcl_x86 +2 -2
  37. run_internvl_3_2b_448_api_ax650.sh +2 -2
  38. run_internvl_3_2b_448_api_axcl_aarch64.sh +1 -1
  39. run_internvl_3_2b_448_api_axcl_x86.sh +1 -1
  40. run_internvl_3_2b_448_ax650.sh +2 -2
  41. run_internvl_3_2b_448_axcl_aarch64.sh +1 -1
  42. run_internvl_3_2b_448_axcl_x86.sh +2 -2
  43. vit_axmodel/internvl3_2b_vit_slim.axmodel +2 -2
README.md CHANGED
@@ -17,7 +17,7 @@ This version of InternVL3-2B has been converted to run on the Axera NPU using **
17
 
18
  This model has been optimized with the following LoRA:
19
 
20
- Compatible with Pulsar2 version: 3.4
21
 
22
  ## Convert tools links:
23
 
@@ -33,6 +33,7 @@ https://huggingface.co/OpenGVLab/InternVL3-2B
33
  ## Support Platform
34
 
35
  - AX650
 
36
  - [M4N-Dock(爱芯派Pro)](https://wiki.sipeed.com/hardware/zh/maixIV/m4ndock/m4ndock.html)
37
  - [M.2 Accelerator card](https://axcl-docs.readthedocs.io/zh-cn/latest/doc_guide_hardware.html)
38
 
@@ -48,37 +49,38 @@ https://huggingface.co/OpenGVLab/InternVL3-2B
48
  Download all files from this repository to the device.
49
 
50
  ```bash
51
- (base) axera@raspberrypi:~/qtang/huggingface/AXERA-TECH/InternVL3-2B $ tree -L 1
52
  .
53
- ├── config.json
54
- ├── examples
55
- ├── gradio_demo_c_api.py
56
- ├── gradio_demo_python_api.py
57
- ├── infer.py
58
- ├── infer_video.py
59
- ├── internvl3_2b_axmodel
60
- ├── internvl3_2b_tokenizer
61
- ├── internvl3_tokenizer.py
62
- ├── llm.py
63
- ├── main_api_ax650
64
- ├── main_api_axcl_aarch64
65
- ├── main_api_axcl_x86
66
- ├── main_ax650
67
- ├── main_axcl_aarch64
68
- ├── main_axcl_x86
69
- ├── post_config.json
70
- ├── README.md
71
- ├── requirements.txt
72
- ├── run_internvl_3_2b_448_api_ax650.sh
73
- ├── run_internvl_3_2b_448_api_axcl_aarch64.sh
74
- ├── run_internvl_3_2b_448_api_axcl_x86.sh
75
- ├── run_internvl_3_2b_448_ax650.sh
76
- ├── run_internvl_3_2b_448_axcl_aarch64.sh
77
- ├── run_internvl_3_2b_448_axcl_x86.sh
78
- └── vit_axmodel
79
-
80
- 6 directories, 22 files
81
-
 
82
  ```
83
 
84
  ### python env requirement
@@ -136,3 +138,88 @@ HTTP 服务地址: http://xxx.xxx.xxx.xxx:7860
136
  Access `http://xxx.xxx.xxx.xxx:7860` using Chrome or another browser.
137
 
138
  ![](webgui.png)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
 
18
  This model has been optimized with the following LoRA:
19
 
20
+ Compatible with Pulsar2 version: 4.2
21
 
22
  ## Convert tools links:
23
 
 
33
  ## Support Platform
34
 
35
  - AX650
36
+ - AX650N DEMO Board
37
  - [M4N-Dock(爱芯派Pro)](https://wiki.sipeed.com/hardware/zh/maixIV/m4ndock/m4ndock.html)
38
  - [M.2 Accelerator card](https://axcl-docs.readthedocs.io/zh-cn/latest/doc_guide_hardware.html)
39
 
 
49
  Download all files from this repository to the device.
50
 
51
  ```bash
52
+ root@ax650:~/huggingface/InternVL3-2B# tree -L 1
53
  .
54
+ |-- README.md
55
+ |-- config.json
56
+ |-- examples
57
+ |-- gradio_demo.py
58
+ |-- gradio_demo_c_api.py
59
+ |-- gradio_demo_python_api.py
60
+ |-- infer.py
61
+ |-- infer_video.py
62
+ |-- internvl3_2b_axmodel
63
+ |-- internvl3_2b_tokenizer
64
+ |-- internvl3_tokenizer.py
65
+ |-- llm.py
66
+ |-- main_api_ax650
67
+ |-- main_api_axcl_aarch64
68
+ |-- main_api_axcl_x86
69
+ |-- main_ax650
70
+ |-- main_axcl_aarch64
71
+ |-- main_axcl_x86
72
+ |-- post_config.json
73
+ |-- requirements.txt
74
+ |-- run_internvl_3_2b_448_api_ax650.sh
75
+ |-- run_internvl_3_2b_448_api_axcl_aarch64.sh
76
+ |-- run_internvl_3_2b_448_api_axcl_x86.sh
77
+ |-- run_internvl_3_2b_448_ax650.sh
78
+ |-- run_internvl_3_2b_448_axcl_aarch64.sh
79
+ |-- run_internvl_3_2b_448_axcl_x86.sh
80
+ |-- vit_axmodel
81
+ `-- webgui.png
82
+
83
+ 4 directories, 24 files
84
  ```
85
 
86
  ### python env requirement
 
138
  Access `http://xxx.xxx.xxx.xxx:7860` using Chrome or another browser.
139
 
140
  ![](webgui.png)
141
+
142
+ #### Inference with AX650 Host, such as M4N-Dock (爱芯派Pro) or AX650N DEMO Board (C++ sample)
143
+ #### Start the Tokenizer service
144
+
145
+ ```
146
+ root@ax650:~/huggingface/InternVL3-2B# python3 internvl3_tokenizer.py
147
+ None None 151645 <|im_end|> 151665 151667
148
+ context_len is 256
149
+ prompt is <|im_start|>system
150
+ 你是书生·万象, 英文名是InternVL, 是由上海人工智能实验室、清华大学及多家合作单位联合开发的多模态大语言模型.<|im_end|>
151
+ ...
152
+ http://0.0.0.0:12345
153
+
154
+ ```
155
+ Open another terminal and run `run_internvl_3_2b_448_ax650.sh`
156
+ ```
157
+ root@ax650:~/huggingface/InternVL3-2B# ./run_internvl_3_2b_448_ax650.sh
158
+ [I][ Init][ 134]: LLM init start
159
+ [I][ Init][ 34]: connect http://0.0.0.0:12345 ok
160
+ bos_id: -1, eos_id: 151645
161
+ img_start_token: 151665
162
+ img_context_token: 151667
163
+ 3% | ██ | 1 / 31 [0.01s<0.37s, 83.33 count/s] tokenizer init ok[I][ Init][ 45]: LLaMaEmbedSelector use mmap
164
+ 6% | ███ | 2 / 31 [0.01s<0.19s, 166.67 count/s] embed_selector init ok
165
+ 100% | ████████████████████████████████ | 31 / 31 [6.26s<6.26s, 4.95 count/s] init post axmodel ok,remain_cmm(7416 MB)[I][ Init][ 226]: IMAGE_CONTEXT_TOKEN: 151667, IMAGE_START_TOKEN: 151665
166
+ [I][ Init][ 251]: image encoder input nchw@float32
167
+ [I][ Init][ 281]: image encoder output float32
168
+
169
+ [I][ Init][ 291]: image_encoder_height : 448, image_encoder_width: 448
170
+ [I][ Init][ 293]: max_token_len : 2559
171
+ [I][ Init][ 296]: kv_cache_size : 256, kv_cache_num: 2559
172
+ [I][ Init][ 304]: prefill_token_num : 128
173
+ [I][ Init][ 308]: grp: 1, prefill_max_token_num : 1
174
+ [I][ Init][ 308]: grp: 2, prefill_max_token_num : 128
175
+ [I][ Init][ 308]: grp: 3, prefill_max_token_num : 256
176
+ [I][ Init][ 308]: grp: 4, prefill_max_token_num : 384
177
+ [I][ Init][ 308]: grp: 5, prefill_max_token_num : 512
178
+ [I][ Init][ 308]: grp: 6, prefill_max_token_num : 640
179
+ [I][ Init][ 308]: grp: 7, prefill_max_token_num : 768
180
+ [I][ Init][ 308]: grp: 8, prefill_max_token_num : 896
181
+ [I][ Init][ 308]: grp: 9, prefill_max_token_num : 1024
182
+ [I][ Init][ 312]: prefill_max_token_num : 1024
183
+ [I][ load_config][ 282]: load config:
184
+ {
185
+ "enable_repetition_penalty": false,
186
+ "enable_temperature": true,
187
+ "enable_top_k_sampling": true,
188
+ "enable_top_p_sampling": false,
189
+ "penalty_window": 20,
190
+ "repetition_penalty": 1.2,
191
+ "temperature": 0.9,
192
+ "top_k": 10,
193
+ "top_p": 0.8
194
+ }
195
+
196
+ [I][ Init][ 321]: LLM init ok
197
+ Type "q" to exit, Ctrl+c to stop current running
198
+ prompt >> 你是谁
199
+ image >>
200
+ [I][ Run][ 551]: input token num : 46, prefill_split_num : 1
201
+ [I][ Run][ 566]: prefill grpid 2
202
+ [I][ Run][ 593]: input_num_token:46
203
+ [I][ Run][ 717]: ttft: 311.26 ms
204
+ 你好!我是商汤科技开发的多模态大模型,英文名叫InternVL。很高兴为你服务!请问有什么可以帮助你的吗?
205
+
206
+ [N][ Run][ 826]: hit eos,avg 10.69 token/s
207
+
208
+ prompt >> 描述一下这张图片
209
+ image >> examples/image_0.jpg
210
+ [I][ Encode][ 415]: image encode time : 408.81 ms, size : 393216
211
+ [I][ Encode][ 524]: idx:0 offset : 49 out_embed.size() : 477696
212
+ [I][ Run][ 551]: input token num : 311, prefill_split_num : 3
213
+ [I][ Run][ 566]: prefill grpid 4
214
+ [I][ Run][ 593]: input_num_token:128
215
+ [I][ Run][ 593]: input_num_token:128
216
+ [I][ Run][ 593]: input_num_token:55
217
+ [I][ Run][ 717]: ttft: 1325.82 ms
218
+ 这张图片展示了一只可爱的红熊猫。红熊猫是一种生活在亚洲森林中的熊科动物,以其红棕色的毛皮和白脸而闻名。图片中的红熊猫正趴在木板上,身体的一部分探出木板,显得有些放松和好奇。它的眼睛圆圆的,黑色的,看起来非常可爱。毛皮主要是棕红色的,耳朵和腹部是白色的,形成了鲜明的对比。背景中可以看到一些树木和绿色的叶子,暗示这可能是在自然的森林环境中拍摄的。整体上,这张图片传达出一种温暖和亲近自然的感觉。
219
+
220
+ [N][ Run][ 826]: hit eos,avg 10.70 token/s
221
+
222
+ prompt >> q
223
+ ```
224
+
225
+
internvl3_2b_axmodel/qwen2_p128_l0_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:566547f9b6a2218381356e0b823879e7bc5a65230e7892bf9b71f35fe5cb544e
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31115b997b4dcc41f4c6ba97658016940c3cee17882f55c3075ac22357f7e941
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l10_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88fcff9f305a53c0c0b8fa22a78c8814e65584b7d8e410b6ee38e1d3167cb498
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb2428ad66ec54ce9281e831abe25c3d9e83f89ff3b14066a490dfafe1eeb585
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l11_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c628f4771502574c1c2450da1eabea71afc02bee5cd32a9a6e401603ad4d504b
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47d5e607133f7d6addeaffb37d76a56e5969c6d32069730bca151dc9a45f2ed8
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l12_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9912b05faabed02d933000326a7b2dfe9a05f9d4f402892073849145bfe96e50
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f224442c6eb37a04b16d2a3c8cad051cc29653ca7c3f547359747fb42b50c09
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l13_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b228900f882b9aea5f0fd410d3e59158cd24527aa0e3e8ac1d3d558645e3fd3d
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9586839e6e53343d33c6897a7f7de2a291dca700524a13a34b902e86d987139
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l14_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7cf8308b9204bd3473897e6d91598d8c4cb7485a4279829119329d2d36a9882
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72046dd0e4b9ecba9a7f4091dae8a3f45b054e49dfd3ab609482a2edc019b8d2
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l15_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c39a58dea42b1610070607c5a6d1d7bef8e16edae7183a271ad6f15fc765cab5
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9fbec6c5c4f7c9b6b5b2631835bc08620b9763818a0954361ea4bca321941e2
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l16_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae575dfe963704b034503e53a13df2d193baba8df35ccf3fb9ae6082ea95ab67
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e57ef1574952fc62a174d0ec45f0230646e816a8246bb50cc935735e1f1a93e
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l17_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fb23bc6883b8b88524b6d5b8f4f225596b9783c123a3e1b6bc4cc7ec49a98a1
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31ee093b10e87b874a92a3a7d57c0e1aed8da199e3bc278e76ef8f6ee2ba1b57
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l18_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42eaacc99e87a3d9ebc88a5f12f83275285384f977d63e60dd142c4672e5c44a
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dfd9149ee03bc07fc0bd0c9872126d47b341bc04b44f885ae2b8a268a600699
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l19_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:949d0fe12d45244098cc772c3701f0e3173d12a98e3975488d6c16c57059b87e
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2da9cd1dc89a16f42e1542891c063e9da117e876b96b5100fc52c030deef5b5
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l1_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe657b85c98d4139f035675a27466bbc719a884817c0605b74ab95a10aeefe4a
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5544c2d489c58cc0044af4690810a1ffc890e29fdab38c9a2c7bd73a089af149
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l20_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42c7b094b5b693623e81c089da77f5d4f6e665d8262b61dbc1dd110920d719cf
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5212839cc201e6ca5e90ff1ec1e9fbf253588dad5ad1c837bcc9053848f25af4
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l21_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe905b027a9fc0378c9b8c2fad994fd6fe07b50a398ec4be75400efcf38000d1
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62c194ef1e7e79b69b83e1175cb2c2bd45cd508dcf9fd4659bd31ee04ef4965a
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l22_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6748d3de2fc7db45d29e8cd0ab76b06404fa1967003dec6671d46ff7f9cdf0d1
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e435f31fe0aa2e1ac1bf8fa9aad70d264296d6753ee1b48a19f9f6c6021b135
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l23_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:397bcf99b84b4edcdb9ff8486a99197057c77665c6ca1516cd843c4e7d001e7b
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3f1f334bbc2dd2b1290ab726c66f3044bfa184398d6ef7fbe50f48f1398c368
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l24_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33c2091bb6a07d07093e44f1a6df4e262761281cff20ed7ec934e96c5ff1606d
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a327bc245121dd324b3bef6e56398323cdf526f96af469210055e09a5c577336
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l25_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1cb522c7ce3e0252df76108e880ae74951aefd0d0733c36e5423a9ed3d750a6e
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1dfc35719298adbd618ca38c4142a42c19ffe580bd49eac1801c55c3ef1ab8b
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l26_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6eea53085ef6d8099137ea9dd7419f3b5ef8714da3cda4096a5adfd82d80d180
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:122fb2c087434f4b9d38b8ee2d84c1f60a771d994a1e79ce87303ac0611258e8
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l27_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f76358d0e13a3eb480705a23e11189a0009d0bcd074573fb6d8506406c985bd7
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b965d9ce79f24ccf3bb690ab645a8e57acb660e416fb782f6b765103f577018a
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l2_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:016fd2f9b492b3f80d18a4508f3e862742cebbdb9ee0efa21c231fd213dea29c
3
- size 81356136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cbc9b29068fc8e4b3488704ca9e7f85946b1aea5bbce8e9b6c15eabd801f944
3
+ size 63498820
internvl3_2b_axmodel/qwen2_p128_l3_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d1bcb6c77421d1e74589a43ed02b8c54fdedd61f97bc64a6a9eefb2bdc87ecb
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3ca02b44fda0690ecafa8a36d5a0f4a56ebe6e73702bca84c1089c3fbf548fe
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l4_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6113220384ffcd4c44f852bdd8c800d1a414f5e4dc2424e6ed97f5e7db5e4d5
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daa424dcaa5e2c376a2485c4112f9be6b1c3a7f57dfc01ff25a4eb045ab72270
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l5_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66ccd095ba921ee9eda510f76836dca192b2827373279226a10447c7e0df54b4
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9a4c51af440e9a4f66f4287931779f3bff8efee4fc283368a5e42090d5bb0f7
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l6_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a21872e47517eafcb3c2a1ad0c8b959a627fd4e4dc7a106b35360438bf272c42
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e94535ca7805298f78f04275f27f44a20536c84985d78bb2faada5be18b72d96
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l7_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20698b243c09c869985831c4d63c7d13dd26d194ff596726bbd1010f2882aab2
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:890b63d139eafbaf118ca3c203f7cafbac4aef02b2fffacbbe54b215d359d862
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l8_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:447476180d7784b36216c4ac67ba8028a8339a59721ca437145b68c7e95488fb
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1435d343d533f375ef4d34859dd8ad6d6885c6d80bebb7852b59ce783d005c31
3
+ size 63496708
internvl3_2b_axmodel/qwen2_p128_l9_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9f17ec940ee1fac261db4bb3aa9d7c1e98f6c7faa477bd2739816cf82675d15
3
- size 81352456
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9d1d65a56b3727e8c224afae6446d536502e70ce31d003287d37ddba5886722
3
+ size 63496708
internvl3_2b_axmodel/qwen2_post.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:056893588013d412e3b41049c0f87a7eae70670b1992d6f17507d50698b97753
3
  size 254396183
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8246a085a945cb020db3aa7d4da5f94db41573298ef711360acb969a20a542d9
3
  size 254396183
main_api_ax650 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fc74b9dcf37c2b75d1894fa0f0ecaffe741b11f13a58dda0d30ff1b4ca8d508
3
- size 6667616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:303579a415049e01b3b4567273797c269dd1a19f36105871a5fec9e7799c64fa
3
+ size 1110872
main_api_axcl_aarch64 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe28789b7b719911f38e18fbcd38b149ac77f4d75129e8629d7fce1c7b3cddf8
3
- size 1870304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57a72b261f5f9ff9a8b52c6fa239275f7d59940f8391568fe0731b01ce1fc869
3
+ size 1870208
main_api_axcl_x86 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:849231c5e30faa54cf62a55022a45b42ed767a7feb52ea26483e5c70eb9073dd
3
- size 1927840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dca142fdb18e4368720ea9b28b6a197745eeec720dd70a544af40fe2a18a7a2
3
+ size 1945760
main_ax650 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b0bc06d4c78f592ae546a9f91f260dd62da7bf6b41a8f8a24a7a648d58c7f72
3
- size 6568824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9972226de2a4197e1c89bde89f71803f8621cba4203c4248ab9a715dcff2f906
3
+ size 1014000
main_axcl_aarch64 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03ff6647009917de1687a84e7601d457e00587af490b54bf1da41b4f0208f691
3
  size 1786544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b4b0ad9be98c900c07d45fd7e421425dda26e9b3a3f0e8666e3f9cf79fce388
3
  size 1786544
main_axcl_x86 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:273bac369315774e6e6df5e725647c49e5356f22cc512f1daadfd58066a37ef0
3
- size 1840560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26530ece559ab78f96a93a8c26e14d5cc84b405d82e86897ce31cf4176677397
3
+ size 1832984
run_internvl_3_2b_448_api_ax650.sh CHANGED
@@ -3,8 +3,8 @@
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
- --filename_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
- --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bf16.bin" \
9
  --tokens_embed_num 151674 \
10
  --tokens_embed_size 1536
 
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
+ --url_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
+ --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
10
  --tokens_embed_size 1536
run_internvl_3_2b_448_api_axcl_aarch64.sh CHANGED
@@ -3,7 +3,7 @@
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./internvl3_2b_ax650/internvl3_2b_vit.axmodel" \
5
  --use_mmap_load_embed 1 \
6
- --filename_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_ax650/qwen2_post.axmodel" \
8
  --filename_tokens_embed "./internvl3_2b_ax650/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
 
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./internvl3_2b_ax650/internvl3_2b_vit.axmodel" \
5
  --use_mmap_load_embed 1 \
6
+ --url_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_ax650/qwen2_post.axmodel" \
8
  --filename_tokens_embed "./internvl3_2b_ax650/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
run_internvl_3_2b_448_api_axcl_x86.sh CHANGED
@@ -3,7 +3,7 @@
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
- --filename_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
  --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bf16.bin" \
9
  --tokens_embed_num 151674 \
 
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
+ --url_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
  --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bf16.bin" \
9
  --tokens_embed_num 151674 \
run_internvl_3_2b_448_ax650.sh CHANGED
@@ -3,9 +3,9 @@
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
- --filename_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
- --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bf16.bin" \
9
  --tokens_embed_num 151674 \
10
  --tokens_embed_size 1536 \
11
  --live_print 1
 
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
+ --url_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
+ --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
10
  --tokens_embed_size 1536 \
11
  --live_print 1
run_internvl_3_2b_448_axcl_aarch64.sh CHANGED
@@ -3,7 +3,7 @@
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./internvl3_2b_ax650/internvl3_2b_vit.axmodel" \
5
  --use_mmap_load_embed 1 \
6
- --filename_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_ax650/qwen2_post.axmodel" \
8
  --filename_tokens_embed "./internvl3_2b_ax650/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
 
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./internvl3_2b_ax650/internvl3_2b_vit.axmodel" \
5
  --use_mmap_load_embed 1 \
6
+ --url_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_ax650/qwen2_post.axmodel" \
8
  --filename_tokens_embed "./internvl3_2b_ax650/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
run_internvl_3_2b_448_axcl_x86.sh CHANGED
@@ -3,9 +3,9 @@
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
- --filename_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
- --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bf16.bin" \
9
  --tokens_embed_num 151674 \
10
  --tokens_embed_size 1536 \
11
  --devices 0,2,4 \
 
3
  --axmodel_num 28 \
4
  --filename_image_encoder_axmodedl "./vit_axmodel/internvl3_2b_vit_slim.axmodel" \
5
  --use_mmap_load_embed 1 \
6
+ --url_tokenizer_model "http://0.0.0.0:12345" \
7
  --filename_post_axmodel "./internvl3_2b_axmodel/qwen2_post.axmodel" \
8
+ --filename_tokens_embed "./internvl3_2b_axmodel/model.embed_tokens.weight.bfloat16.bin" \
9
  --tokens_embed_num 151674 \
10
  --tokens_embed_size 1536 \
11
  --devices 0,2,4 \
vit_axmodel/internvl3_2b_vit_slim.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6bc177b14c60a52271a8492ac96a961a8a25477840394fea364cb77612c0298b
3
- size 372497620
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90e725427e9743dde93af8aa561b115a233e8db7f75dbb7dfe1d47be439b41d8
3
+ size 373371657