wli1995 committed on
Commit
6f04984
·
verified ·
1 Parent(s): a043a29

Upload C++ demo

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +31 -0
  2. .infer_axmodel_650.py.swn +0 -0
  3. .infer_axmodel_650.py.swo +0 -0
  4. .infer_axmodel_650.py.swp +0 -0
  5. FastVLM_tokenizer.txt +0 -0
  6. README.md +136 -62
  7. embeds/model.embed_tokens.weight.bfloat16.bin +2 -2
  8. embeds/model.embed_tokens.weight.npy +2 -2
  9. fastvlm_C128_CTX1024_P640_ax620e/image_encoder_512x512_ax620e.axmodel +3 -0
  10. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l0_together.axmodel +3 -0
  11. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l10_together.axmodel +3 -0
  12. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l11_together.axmodel +3 -0
  13. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l12_together.axmodel +3 -0
  14. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l13_together.axmodel +3 -0
  15. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l14_together.axmodel +3 -0
  16. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l15_together.axmodel +3 -0
  17. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l16_together.axmodel +3 -0
  18. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l17_together.axmodel +3 -0
  19. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l18_together.axmodel +3 -0
  20. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l19_together.axmodel +3 -0
  21. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l1_together.axmodel +3 -0
  22. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l20_together.axmodel +3 -0
  23. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l21_together.axmodel +3 -0
  24. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l22_together.axmodel +3 -0
  25. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l23_together.axmodel +3 -0
  26. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l2_together.axmodel +3 -0
  27. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l3_together.axmodel +3 -0
  28. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l4_together.axmodel +3 -0
  29. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l5_together.axmodel +3 -0
  30. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l6_together.axmodel +3 -0
  31. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l7_together.axmodel +3 -0
  32. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l8_together.axmodel +3 -0
  33. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l9_together.axmodel +3 -0
  34. fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_post.axmodel +3 -0
  35. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l0_together.axmodel +2 -2
  36. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l10_together.axmodel +2 -2
  37. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l11_together.axmodel +2 -2
  38. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l12_together.axmodel +2 -2
  39. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l13_together.axmodel +2 -2
  40. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l14_together.axmodel +2 -2
  41. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l15_together.axmodel +2 -2
  42. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l16_together.axmodel +2 -2
  43. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l17_together.axmodel +2 -2
  44. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l18_together.axmodel +2 -2
  45. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l19_together.axmodel +2 -2
  46. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l1_together.axmodel +2 -2
  47. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l20_together.axmodel +2 -2
  48. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l21_together.axmodel +2 -2
  49. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l22_together.axmodel +2 -2
  50. fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l23_together.axmodel +2 -2
.gitattributes CHANGED
@@ -87,3 +87,34 @@ fastvlm_C128_CTX512_P256_ax620e/llava_qwen2_p128_l9_together.axmodel filter=lfs
87
  fastvlm_C128_CTX512_P256_ax620e/llava_qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
88
  images/image_1.jpg filter=lfs diff=lfs merge=lfs -text
89
  images/ssd_horse.jpg filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
87
  fastvlm_C128_CTX512_P256_ax620e/llava_qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
88
  images/image_1.jpg filter=lfs diff=lfs merge=lfs -text
89
  images/ssd_horse.jpg filter=lfs diff=lfs merge=lfs -text
90
+ fastvlm_C128_CTX1024_P640_ax620e/image_encoder_512x512_ax620e.axmodel filter=lfs diff=lfs merge=lfs -text
91
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l0_together.axmodel filter=lfs diff=lfs merge=lfs -text
92
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l10_together.axmodel filter=lfs diff=lfs merge=lfs -text
93
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l11_together.axmodel filter=lfs diff=lfs merge=lfs -text
94
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l12_together.axmodel filter=lfs diff=lfs merge=lfs -text
95
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l13_together.axmodel filter=lfs diff=lfs merge=lfs -text
96
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l14_together.axmodel filter=lfs diff=lfs merge=lfs -text
97
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l15_together.axmodel filter=lfs diff=lfs merge=lfs -text
98
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l16_together.axmodel filter=lfs diff=lfs merge=lfs -text
99
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l17_together.axmodel filter=lfs diff=lfs merge=lfs -text
100
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l18_together.axmodel filter=lfs diff=lfs merge=lfs -text
101
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l19_together.axmodel filter=lfs diff=lfs merge=lfs -text
102
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l1_together.axmodel filter=lfs diff=lfs merge=lfs -text
103
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l20_together.axmodel filter=lfs diff=lfs merge=lfs -text
104
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l21_together.axmodel filter=lfs diff=lfs merge=lfs -text
105
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l22_together.axmodel filter=lfs diff=lfs merge=lfs -text
106
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l23_together.axmodel filter=lfs diff=lfs merge=lfs -text
107
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l2_together.axmodel filter=lfs diff=lfs merge=lfs -text
108
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l3_together.axmodel filter=lfs diff=lfs merge=lfs -text
109
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l4_together.axmodel filter=lfs diff=lfs merge=lfs -text
110
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l5_together.axmodel filter=lfs diff=lfs merge=lfs -text
111
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l6_together.axmodel filter=lfs diff=lfs merge=lfs -text
112
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l7_together.axmodel filter=lfs diff=lfs merge=lfs -text
113
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l8_together.axmodel filter=lfs diff=lfs merge=lfs -text
114
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l9_together.axmodel filter=lfs diff=lfs merge=lfs -text
115
+ fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
116
+ fastvlm_tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
117
+ main_ax650 filter=lfs diff=lfs merge=lfs -text
118
+ main_ax650_api filter=lfs diff=lfs merge=lfs -text
119
+ main_axcl_x86 filter=lfs diff=lfs merge=lfs -text
120
+ main_axcl_x86_api filter=lfs diff=lfs merge=lfs -text
.infer_axmodel_650.py.swn ADDED
Binary file (16.4 kB). View file
 
.infer_axmodel_650.py.swo ADDED
Binary file (20.5 kB). View file
 
.infer_axmodel_650.py.swp ADDED
Binary file (20.5 kB). View file
 
FastVLM_tokenizer.txt ADDED
The diff for this file is too large to render. See raw diff
 
README.md CHANGED
@@ -38,7 +38,8 @@ How to Convert LLM from Huggingface to axmodel[TODO]
38
 
39
  |Chips|image encoder|ttft|w4a16|
40
  |--|--|--|--|
41
- |AX650N| 44.572 ms (512x512)| 94.532 ms (99tokens)| 34.81 tokens/sec|
 
42
  |AX630C| 205.961 ms (512x512)| 489.013 ms (99tokens)| 11.67 tokens/sec|
43
 
44
 
@@ -49,19 +50,29 @@ Download all files from this repository to the device
49
  ```
50
  $tree -L 1
51
  .
52
- |-- README.md
53
- |-- config.json
54
- |-- embeds
55
- |-- fastvlm_C128_CTX1024_P640_ax650
56
- |-- fastvlm_C128_CTX512_P256_ax620e
57
- |-- fastvlm_tokenizer
58
- |-- images
59
- |-- infer_axmodel_620e.py
60
- |-- infer_axmodel_650.py
61
- |-- requirements.txt
62
- `-- utils
63
-
64
- 6 directories, 5 files
 
 
 
 
 
 
 
 
 
 
65
  ```
66
 
67
  #### Install transformer
@@ -70,125 +81,188 @@ $tree -L 1
70
  pip install -r requirements.txt
71
  ```
72
 
73
- #### Inference with AX630C Host
74
 
75
  Run the following command on the Axera board to start a chat conversation:
76
 
77
- ```sh
78
- python3 infer_axmodel_620e.py -v ./fastvlm_C128_CTX512_P256_ax620e/image_encoder_512x512_ax620e.axmodel -m ./fastvlm_C128_CTX512_P256_ax620e -t fastvlm_tokenizer -i 512
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
  ```
80
 
81
- output:
 
82
  ```
83
- [INFO] Available providers: ['AxEngineExecutionProvider']
 
 
 
84
  Loading config, tokenizer and init model.
85
  [INFO] Using provider: AxEngineExecutionProvider
86
- [INFO] Chip type: ChipType.MC20E
87
  [INFO] VNPU type: VNPUType.DISABLED
88
- [INFO] Engine version: 2.7.2a
89
- [INFO] Model type: 1 (full core)
90
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
91
  Detected prefixes: ['llava_qwen2'], chosen: llava_qwen2, layers: 24
92
  Init InferenceSession: 0%| | 0/24 [00:00<?, ?it/s][INFO] Using provider: AxEngineExecutionProvider
93
- [INFO] Model type: 1 (full core)
94
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
95
- Init InferenceSession: 4%|████▊ | 1/24
96
- [00:02<00:00, 9.25it/s]
97
- ...
98
  [INFO] Using provider: AxEngineExecutionProvider
99
- [INFO] Model type: 1 (full core)
 
 
 
100
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
101
- Init InferenceSession: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24/24 [00:02<00:00, 9.12it/s]
102
  [INFO] Using provider: AxEngineExecutionProvider
103
- [INFO] Model type: 1 (full core)
 
 
 
104
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
105
  Model loaded successfully!
106
  [INFO]: 输入文本进行对话,或者输入图片路径进行图片理解, 或者输入q退出对话。
107
  prompt<<who are you
108
  slice_indices: [0]
109
  Slice prefill done: 0
110
- answer >> I'm an AI language model, I don't have personal identity or a physical body. I exist solely as a digital creation created by Apple. I don't have a name or a personal identity. I'm designed to assist and provide information to users. Is there anything else I can help you with?
111
 
112
  prompt<<./images/ssd_horse.jpg
113
  slice_indices: [0]
114
  Slice prefill done: 0
115
- answer >> The image depicts a person riding a brown horse with a white blaze on its face. The rider is wearing a blue hoodie and blue jeans, and is holding the reins of the horse. The horse is standing on a dirt ground with some grass and trees in the background. The rider is also holding a rope in their left hand, which is attached to the horse's harness.
116
 
117
- To the left of the horse, there is a brown dog standing on the ground, looking up at the rider. The dog appears to be in a begging or pleading position, with its front paws raised and its mouth open.
118
 
119
- In the background, there is a gray pickup truck parked on the grass, and a wooden fence can be seen behind the horse and rider. There are also some people visible in the background, including a person in a red shirt and another person in a blue shirt. The overall scene appears to be taking place in an outdoor setting, possibly a ranch or a farm.
 
 
120
 
121
  prompt<<./images/image_1.jpg
122
  slice_indices: [0]
123
  Slice prefill done: 0
124
- answer >> The image depicts a panda bear in a naturalistic enclosure, likely within a zoo or wildlife sanctuary. The panda is sitting on its hind legs, with its front paws resting on a wooden structure that resembles a tree stump. The panda's distinctive black and white fur is clearly visible, with the black fur covering its ears, eyes, and the area around its nose and mouth, while the white fur covers the rest of its body. The panda's black nose and the black fur around its mouth are also visible.
125
 
126
- The panda is surrounded by green foliage, including bamboo shoots and other plants, which are typical of a panda's natural habitat. The ground appears to be covered with dirt and small rocks, and there are some larger rocks and a tree stump in the background. The lighting in the image suggests that it was taken during the daytime, with natural light illuminating the scene. The overall setting appears to be a well-maintained and naturalistic enclosure designed to mimic the panda's natural environment.
 
 
127
 
128
  prompt<<q
129
  [INFO]: 对话结束,再见。
130
  ```
131
 
132
- #### Inference with AX650 Host, such as M4N-Dock(爱芯派Pro) or AX650 DEMO Board
133
 
134
  Run the following command on the Axera board to start a chat conversation:
135
 
136
  ```sh
137
- $ python3 infer_axmodel_650.py -v ./fastvlm_C128_CTX1024_P640_ax650/image_encoder_512x512_0.5b_ax650.axmodel -m ./fastvlm_C128_CTX1024_P640_ax650 -t fastvlm_tokenizer -i 512
138
  ```
139
- output:
140
 
141
- ```bash
142
- [INFO] Available providers: ['AxEngineExecutionProvider', 'AXCLRTExecutionProvider']
 
143
  Loading config, tokenizer and init model.
144
  [INFO] Using provider: AxEngineExecutionProvider
145
- [INFO] Chip type: ChipType.MC50
146
  [INFO] VNPU type: VNPUType.DISABLED
147
- [INFO] Engine version: 2.12.0s
148
- [INFO] Model type: 2 (triple core)
149
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
150
  Detected prefixes: ['llava_qwen2'], chosen: llava_qwen2, layers: 24
151
  Init InferenceSession: 0%| | 0/24 [00:00<?, ?it/s][INFO] Using provider: AxEngineExecutionProvider
152
- [INFO] Model type: 2 (triple core)
153
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
 
 
 
154
  [INFO] Using provider: AxEngineExecutionProvider
155
- [INFO] Model type: 2 (triple core)
156
- [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
157
- Init InferenceSession: 8%|█████████▌ | 2/24 [00:00<00:01, 17.39it/s][INFO] Using provider: AxEngineExecutionProvider
158
- [INFO] Model type: 2 (triple core)
159
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
 
160
  [INFO] Using provider: AxEngineExecutionProvider
161
- ...
162
- Init InferenceSession: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24/24 [00:00<00:00, 24.30it/s]
163
- [INFO] Using provider: AxEngineExecutionProvider
164
- [INFO] Model type: 2 (triple core)
165
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
166
  Model loaded successfully!
167
  [INFO]: 输入文本进行对话,或者输入图片路径进行图片理解, 或者输入q退出对话。
168
  prompt<<who are you
169
  slice_indices: [0]
170
  Slice prefill done: 0
171
- answer >> I'm an AI language model, I don't have personal identity or a physical body. I exist solely as a digital entity designed to assist and provide information to users. I don't have a name or a personal identity, but I can provide information and answer questions based on my training data and algorithms. Is there something specific you would like to know about me?
172
 
173
  prompt<<./images/ssd_horse.jpg
174
  slice_indices: [0]
175
  Slice prefill done: 0
176
- answer >> The image depicts a person riding a brown horse with a white blaze on its face. The rider is wearing a gray hoodie and blue jeans, and is holding the reins of the horse. The horse is standing on a dirt ground with some grass and trees in the background.
177
-
178
- To the left of the horse, there is a brown dog sitting on the ground. The dog is looking up at the rider with its mouth open, as if it is begging or reacting to something.
179
 
180
- In the background, there is a gray pickup truck parked on the grass, and a person wearing a red shirt and blue jeans is standing near the truck. There is also a wooden fence and some trees in the background.
181
 
182
- The overall scene appears to be taking place in a rural or outdoor setting, possibly a farm or ranch.
183
 
184
  prompt<<./images/image_1.jpg
185
  slice_indices: [0]
186
  Slice prefill done: 0
187
- answer >> The image depicts a panda bear in a naturalistic enclosure, likely within a zoo or wildlife sanctuary. The panda is lying on its stomach with its head resting on its front paws, appearing relaxed and content. The panda's distinctive black and white fur is clearly visible, with the black fur covering its ears, eyes, and limbs, while the white fur covers its face, neck, and the underside of its body. The panda's black nose and mouth are also visible.
188
-
189
- The panda is surrounded by green foliage, including bamboo shoots and other plants, which are typical of a panda's natural habitat. In the background, there is a wooden structure that resembles a tree stump or a small tree, adding to the naturalistic setting. The ground is covered with dirt and leaves, further emphasizing the natural environment.
190
 
191
- The lighting in the image is natural, suggesting that the photo was taken during the day. The overall scene conveys a sense of tranquility and the panda's comfort in its environment.
192
 
193
  prompt<<q
194
  [INFO]: 对话结束,再见。
 
38
 
39
  |Chips|image encoder|ttft|w4a16|
40
  |--|--|--|--|
41
+ |AX650N| 59.83 ms (512x512)| 76.36 ms (100tokens)| 34.81 tokens/sec|
42
+ |AXCL x86| 51.80 ms (512x512)| 145.05 ms (93tokens)| 17.40 tokens/sec|
43
  |AX630C| 205.961 ms (512x512)| 489.013 ms (99tokens)| 11.67 tokens/sec|
44
 
45
 
 
50
  ```
51
  $tree -L 1
52
  .
53
+ ├── config.json
54
+ ├── embeds
55
+ ├── fastvlm_C128_CTX1024_P640_ax620e
56
+ ├── fastvlm_C128_CTX1024_P640_ax650
57
+ ├── fastvlm_tokenizer
58
+ ├── FastVLM_tokenizer.txt
59
+ ├── images
60
+ ├── infer_axmodel_620e.py
61
+ ├── infer_axmodel_650.py
62
+ ├── main_ax650
63
+ ├── main_ax650_api
64
+ ├── main_axcl_x86
65
+ ├── main_axcl_x86_api
66
+ ├── post_config.json
67
+ ├── README.md
68
+ ├── requirements.txt
69
+ ├── run_ax650_512.sh
70
+ ├── run_ax650_api.sh
71
+ ├── run_axcl_x86_api.sh
72
+ ├── run_axcl_x86.sh
73
+ └── utils
74
+
75
+ 7 directories, 15 files
76
  ```
77
 
78
  #### Install transformer
 
81
  pip install -r requirements.txt
82
  ```
83
 
84
+ #### Inference with AX650 Host, such as M4N-Dock(爱芯派Pro) or AX650 DEMO Board
85
 
86
  Run the following command on the Axera board to start a chat conversation:
87
 
88
+ ```
89
+ root@ax650:~/FastVLM-0.5B# ./run_ax650_512.sh
90
+ [I][ Init][ 134]: LLM init start
91
+ tokenizer_type = 3
92
+ stop_tokens size: 2
93
+ 151645
94
+ 151645
95
+ 7% | ███ | 2 / 27 [1.06s<14.26s, 1.89 count/s] embed_selector init ok
96
+ 100% | ████████████████████████████████ | 27 / 27 [2.35s<2.35s, 11.51 count/s] init post axmodel ok,remain_cmm(9222 MB)[I][ Init][ 252]: IMAGE_CONTEXT_TOKEN: 151646
97
+ [I][ Init][ 284]: image encoder input nhwc@uint8
98
+ [I][ Init][ 308]: image encoder output float32
99
+
100
+ [I][ Init][ 318]: image_encoder_height : 512, image_encoder_width: 512
101
+ [I][ Init][ 320]: max_token_len : 1024
102
+ [I][ Init][ 323]: kv_cache_size : 128, kv_cache_num: 1024
103
+ [I][ Init][ 331]: prefill_token_num : 128
104
+ [I][ Init][ 335]: grp: 1, prefill_max_token_num : 1
105
+ [I][ Init][ 335]: grp: 2, prefill_max_token_num : 128
106
+ [I][ Init][ 335]: grp: 3, prefill_max_token_num : 256
107
+ [I][ Init][ 335]: grp: 4, prefill_max_token_num : 512
108
+ [I][ Init][ 335]: grp: 5, prefill_max_token_num : 640
109
+ [I][ Init][ 339]: prefill_max_token_num : 640
110
+ [I][ load_config][ 282]: load config:
111
+ {
112
+ "enable_repetition_penalty": false,
113
+ "enable_temperature": true,
114
+ "enable_top_k_sampling": true,
115
+ "enable_top_p_sampling": false,
116
+ "penalty_window": 30,
117
+ "repetition_penalty": 2,
118
+ "temperature": 0.1,
119
+ "top_k": 10,
120
+ "top_p": 0.8
121
+ }
122
+
123
+ [I][ Init][ 348]: LLM init ok
124
+ Type "q" to exit, Ctrl+c to stop current running
125
+ prompt >> who are you
126
+ image >>
127
+ [I][ Encode][ 470]: input_ids size: 33
128
+ [I][ Run][ 604]: input token num : 33, prefill_split_num : 1
129
+ [I][ Run][ 619]: prefill grpid 2
130
+ [I][ Run][ 646]: input_num_token:33
131
+ [I][ Run][ 770]: ttft: 76.40 ms
132
+ I am a language model created by Apple Inc. I am designed to assist users in generating human-like text based on the input they provide. I can understand and generate text based on the context and the input provided by the user. I am not capable of generating human-like text, but I can generate text based on the context and the input provided by the user.
133
+
134
+ [N][ Run][ 879]: hit eos,avg 31.22 token/s
135
+
136
+ prompt >> describe the image.
137
+ image >> ./images/image_1.jpg
138
+ [I][ Encode][ 442]: image encode time : 59.83 ms, size : 57344
139
+ [I][ Encode][ 496]: imgs_embed.size() : 1, media token size : 64
140
+ [I][ Run][ 604]: input token num : 100, prefill_split_num : 1
141
+ [I][ Run][ 619]: prefill grpid 2
142
+ [I][ Run][ 646]: input_num_token:100
143
+ [I][ Run][ 770]: ttft: 76.36 ms
144
+ The image depicts a panda bear in a naturalistic enclosure, likely within a zoo or wildlife sanctuary. The panda is lying on its stomach with its head resting on a log, appearing relaxed and content. The panda's distinctive black and white fur is clearly visible, with its black ears, eyes, and nose contrasting against its white face and body. The enclosure is surrounded by greenery, including bamboo and other plants, which adds to the natural habitat feel of the scene. The panda appears to be in a comfortable and secure environment, with ample space to move around and interact with its surroundings.
145
+
146
+ [N][ Run][ 879]: hit eos,avg 31.30 token/s
147
+
148
+ prompt >> q
149
  ```
150
 
151
+ ```sh
152
+ $ python3 infer_axmodel_650.py -v ./fastvlm_C128_CTX1024_P640_ax650/image_encoder_512x512_0.5b_ax650.axmodel -m ./fastvlm_C128_CTX1024_P640_ax650 -t fastvlm_tokenizer -i 512
153
  ```
154
+ output:
155
+
156
+ ```bash
157
+ [INFO] Available providers: ['AxEngineExecutionProvider', 'AXCLRTExecutionProvider']
158
  Loading config, tokenizer and init model.
159
  [INFO] Using provider: AxEngineExecutionProvider
160
+ [INFO] Chip type: ChipType.MC50
161
  [INFO] VNPU type: VNPUType.DISABLED
162
+ [INFO] Engine version: 2.12.0s
163
+ [INFO] Model type: 2 (triple core)
164
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
165
  Detected prefixes: ['llava_qwen2'], chosen: llava_qwen2, layers: 24
166
  Init InferenceSession: 0%| | 0/24 [00:00<?, ?it/s][INFO] Using provider: AxEngineExecutionProvider
167
+ [INFO] Model type: 2 (triple core)
168
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
 
 
 
169
  [INFO] Using provider: AxEngineExecutionProvider
170
+ [INFO] Model type: 2 (triple core)
171
+ [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
172
+ Init InferenceSession: 8%|█████████▌ | 2/24 [00:00<00:01, 17.39it/s][INFO] Using provider: AxEngineExecutionProvider
173
+ [INFO] Model type: 2 (triple core)
174
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
 
175
  [INFO] Using provider: AxEngineExecutionProvider
176
+ ...
177
+ Init InferenceSession: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24/24 [00:00<00:00, 24.30it/s]
178
+ [INFO] Using provider: AxEngineExecutionProvider
179
+ [INFO] Model type: 2 (triple core)
180
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
181
  Model loaded successfully!
182
  [INFO]: 输入文本进行对话,或者输入图片路径进行图片理解, 或者输入q退出对话。
183
  prompt<<who are you
184
  slice_indices: [0]
185
  Slice prefill done: 0
186
+ answer >> I'm an AI language model, I don't have personal identity or a physical body. I exist solely as a digital entity designed to assist and provide information to users. I don't have a name or a personal identity, but I can provide information and answer questions based on my training data and algorithms. Is there something specific you would like to know about me?
187
 
188
  prompt<<./images/ssd_horse.jpg
189
  slice_indices: [0]
190
  Slice prefill done: 0
191
+ answer >> The image depicts a person riding a brown horse with a white blaze on its face. The rider is wearing a gray hoodie and blue jeans, and is holding the reins of the horse. The horse is standing on a dirt ground with some grass and trees in the background.
192
 
193
+ To the left of the horse, there is a brown dog sitting on the ground. The dog is looking up at the rider with its mouth open, as if it is begging or reacting to something.
194
 
195
+ In the background, there is a gray pickup truck parked on the grass, and a person wearing a red shirt and blue jeans is standing near the truck. There is also a wooden fence and some trees in the background.
196
+
197
+ The overall scene appears to be taking place in a rural or outdoor setting, possibly a farm or ranch.
198
 
199
  prompt<<./images/image_1.jpg
200
  slice_indices: [0]
201
  Slice prefill done: 0
202
+ answer >> The image depicts a panda bear in a naturalistic enclosure, likely within a zoo or wildlife sanctuary. The panda is lying on its stomach with its head resting on its front paws, appearing relaxed and content. The panda's distinctive black and white fur is clearly visible, with the black fur covering its ears, eyes, and limbs, while the white fur covers its face, neck, and the underside of its body. The panda's black nose and mouth are also visible.
203
 
204
+ The panda is surrounded by green foliage, including bamboo shoots and other plants, which are typical of a panda's natural habitat. In the background, there is a wooden structure that resembles a tree stump or a small tree, adding to the naturalistic setting. The ground is covered with dirt and leaves, further emphasizing the natural environment.
205
+
206
+ The lighting in the image is natural, suggesting that the photo was taken during the day. The overall scene conveys a sense of tranquility and the panda's comfort in its environment.
207
 
208
  prompt<<q
209
  [INFO]: 对话结束,再见。
210
  ```
211
 
212
+ #### Inference with AX630C Host
213
 
214
  Run the following command on the Axera board to start a chat conversation:
215
 
216
  ```sh
217
+ python3 infer_axmodel_620e.py -v ./fastvlm_C128_CTX512_P256_ax620e/image_encoder_512x512_ax620e.axmodel -m ./fastvlm_C128_CTX512_P256_ax620e -t fastvlm_tokenizer -i 512
218
  ```
 
219
 
220
+ output:
221
+ ```
222
+ [INFO] Available providers: ['AxEngineExecutionProvider']
223
  Loading config, tokenizer and init model.
224
  [INFO] Using provider: AxEngineExecutionProvider
225
+ [INFO] Chip type: ChipType.MC20E
226
  [INFO] VNPU type: VNPUType.DISABLED
227
+ [INFO] Engine version: 2.7.2a
228
+ [INFO] Model type: 1 (full core)
229
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
230
  Detected prefixes: ['llava_qwen2'], chosen: llava_qwen2, layers: 24
231
  Init InferenceSession: 0%| | 0/24 [00:00<?, ?it/s][INFO] Using provider: AxEngineExecutionProvider
232
+ [INFO] Model type: 1 (full core)
233
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
234
+ Init InferenceSession: 4%|████▊ | 1/24
235
+ [00:02<00:00, 9.25it/s]
236
+ ...
237
  [INFO] Using provider: AxEngineExecutionProvider
238
+ [INFO] Model type: 1 (full core)
 
 
 
239
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
240
+ Init InferenceSession: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 24/24 [00:02<00:00, 9.12it/s]
241
  [INFO] Using provider: AxEngineExecutionProvider
242
+ [INFO] Model type: 1 (full core)
 
 
 
243
  [INFO] Compiler version: 5.1-patch1-dirty 0a5b164f-dirty
244
  Model loaded successfully!
245
  [INFO]: 输入文本进行对话,或者输入图片路径进行图片理解, 或者输入q退出对话。
246
  prompt<<who are you
247
  slice_indices: [0]
248
  Slice prefill done: 0
249
+ answer >> I'm an AI language model, I don't have personal identity or a physical body. I exist solely as a digital creation created by Apple. I don't have a name or a personal identity. I'm designed to assist and provide information to users. Is there anything else I can help you with?
250
 
251
  prompt<<./images/ssd_horse.jpg
252
  slice_indices: [0]
253
  Slice prefill done: 0
254
+ answer >> The image depicts a person riding a brown horse with a white blaze on its face. The rider is wearing a blue hoodie and blue jeans, and is holding the reins of the horse. The horse is standing on a dirt ground with some grass and trees in the background. The rider is also holding a rope in their left hand, which is attached to the horse's harness.
 
 
255
 
256
+ To the left of the horse, there is a brown dog standing on the ground, looking up at the rider. The dog appears to be in a begging or pleading position, with its front paws raised and its mouth open.
257
 
258
+ In the background, there is a gray pickup truck parked on the grass, and a wooden fence can be seen behind the horse and rider. There are also some people visible in the background, including a person in a red shirt and another person in a blue shirt. The overall scene appears to be taking place in an outdoor setting, possibly a ranch or a farm.
259
 
260
  prompt<<./images/image_1.jpg
261
  slice_indices: [0]
262
  Slice prefill done: 0
263
+ answer >> The image depicts a panda bear in a naturalistic enclosure, likely within a zoo or wildlife sanctuary. The panda is sitting on its hind legs, with its front paws resting on a wooden structure that resembles a tree stump. The panda's distinctive black and white fur is clearly visible, with the black fur covering its ears, eyes, and the area around its nose and mouth, while the white fur covers the rest of its body. The panda's black nose and the black fur around its mouth are also visible.
 
 
264
 
265
+ The panda is surrounded by green foliage, including bamboo shoots and other plants, which are typical of a panda's natural habitat. The ground appears to be covered with dirt and small rocks, and there are some larger rocks and a tree stump in the background. The lighting in the image suggests that it was taken during the daytime, with natural light illuminating the scene. The overall setting appears to be a well-maintained and naturalistic enclosure designed to mimic the panda's natural environment.
266
 
267
  prompt<<q
268
  [INFO]: 对话结束,再见。
embeds/model.embed_tokens.weight.bfloat16.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0403b365004db461375fe5d5daebcc61bab76b884844d84cbc0ba5820085e0e9
3
- size 272269312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bfa5dd1b4f87a9a1b42ffd26d17532d9631e0f299eee75f6d9a1ef5360ed7fb
3
+ size 271751424
embeds/model.embed_tokens.weight.npy CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69ebc4dd0a736c34db773c86bc708eda4dbcc626dc7bee4d363c103a9bb6d100
3
- size 544538752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba20f7ac021ad9bea734ba51ee01de5331611ae6b45fc35562d0cb79bf0c810c
3
+ size 543502976
fastvlm_C128_CTX1024_P640_ax620e/image_encoder_512x512_ax620e.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f914c7bd4b237095742e87fbd1a0dc0974e3184bf23cd13f7194558e952effef
3
+ size 160413696
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l0_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c64b87c5a790bfdbc1ed227c6e30c040a354fdf856f1d257b88a1d09ad4571
3
+ size 16712241
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l10_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cab7dc4d97e6a84957cf9d0989e50dc46fcdd4560df01014b46693c2109b81c
3
+ size 16712217
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l11_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11450a57a33a8e02ac3eefa60d06818ac8ed11f2bbcca25cf61d5d5557be8613
3
+ size 16712249
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l12_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbe3ec3a94528846e34c1ee61ec3b16eabbdc8ae2b437dd89a157a389e648bc8
3
+ size 16712225
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l13_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c2519cfefd3be7c7376b349a545a7b4c04a414df1a5cbddd89c2bded52f013e
3
+ size 16712321
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l14_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642de73dd94e59615ef64994844eec30496dcd0ad66561124225a9fd7567ca3e
3
+ size 16712217
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l15_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89f5211bac18e4d8ddf825c9fd0f807dfbe498624c762193b605ddaec5bd6204
3
+ size 16712185
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l16_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05b12ad7080afefd87378d7191bdc47e92bd886f17657a62a8c5caac1adcc3e2
3
+ size 16712201
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l17_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:417da914dd2b59daca236e0c68210387eae42deba91835735d8937a3d8efa072
3
+ size 16712313
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l18_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e35e10cd6a0cea16e1afe3fc16a47a05864c991bb0ded00797cdd5a9f87e84ff
3
+ size 16712225
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l19_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32799a8281e5b64600a31445a703250d4beecb91a69188c19e64254cb3e4074b
3
+ size 16712209
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l1_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ff1aa08b5f05457633936fce8650400fb7ad74ad9aba5711003ded4d27ee4c4
3
+ size 16712225
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l20_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2e60874879ae0c7ab60ee12eb72caaab4b4c04579d0d465374e2f3dd03af80
3
+ size 16712233
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l21_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:590964a4aa9fa629fad9708756909964c92071e91bcc481521be26e7ff77a037
3
+ size 16712241
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l22_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fcb9deefbab7821ed686403ac328d6a3176864b38b5edc7e128a25d0836b49b
3
+ size 16712265
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l23_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98d90727215c176e12d9d939975ffeb01c5b8463ca658083dfedae36d43eba6d
3
+ size 16712209
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l2_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c460ec06d43433bc8c2481fe6294dd7d02533744c5bd89383b25641d2c50840
3
+ size 16712305
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l3_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36e16af33f7936e81030130c796584f9863849d4fb2686aae96b8412f321050d
3
+ size 16712241
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l4_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a1f020f4187d283ff134a7cbfdb2ff1cd066eef2030e8fe09def8b36d655f8b
3
+ size 16712233
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l5_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d2f1967ed1305f6aa0e1ffc9fc9ed6d900d5446dede465a4de0d111519dccf1
3
+ size 16712193
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l6_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54336601b83dcda22185799fff0459e8c4a2d43eadde4cfcc8093537c7c43e6
3
+ size 16712233
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l7_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a926793428c6cca65a2878071570fdbad3710bcc3e6a4b12560797d4131bdcc
3
+ size 16712217
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l8_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81137ad98e6d26b39059705e4e3bf5380b612e579f4c41452211f34c317f7899
3
+ size 16712241
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_p128_l9_together.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82c2af786a8cbf7b3e1eeebd6127e91b0aff705c3080e2aa3774f05a0810f700
3
+ size 16712289
fastvlm_C128_CTX1024_P640_ax620e/llava_qwen2_post.axmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:391aff25ad252109d286cb1b393429ae0738ec1107c2fb997897351cb2e4bd0c
3
+ size 139682851
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l0_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11a3483817e1ce66cc95c612619a1a1e60e4bbc77a012617b0b845cde0268a11
3
- size 17508925
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e23b62154e6d3d0a1312666632dd25cbf79c0dceafbf27795dd09aaa1d57d36
3
+ size 18243005
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l10_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7a88c0a139e09a37ed079166a152c6208707c84645745f2c7fed31a77c74d29
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0bbf3a03b783592fa8f20747acacfd144db977ac04ca5731871a37213e2ff4f
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l11_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e1060f24145f4c2f773c5ed9cbcfa04e9dd2b59f62be3772287e9f515ad2a43
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aa90dedd23c615109c92409eca7ee7217faa4e2814c35fd99be735fe0965cb5
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l12_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17147af14d42c305172ee511c69c33281c354dd746261a2cb6d1df326eff9868
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db480a73fa9093f469ac1f71388f7ec7232e1f5de1956b209c2eed692200de5b
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l13_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd76a3f9d764935b7f94439762ffda93a92911dc813522076eea2c850942632b
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93ff168d4042051532fbb52263eb7d6ca47fee2188cec02c7f433d5226c268c2
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l14_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:404e37e37f43285f04d55e3b68586dd2cab0b675c5658c62ce16ad677b920cf1
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71abc53e667625e33feff9742576bcf8d18bf060e148f39d7a8aae48de8f44c6
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l15_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8e1fd1fb7de4aa9c859543c7f07fd410bbdcd0deb6a20375f3f47024ed44cef
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ed18ae52df489551b0419ea855e46445e1723b5a3c089c278c193de9d0cac3a
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l16_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3020712849ef594d4104aa1402442cbeb7f334f56ef9b4b8b3e063f345cbfe3
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4ede5b86577c975ae12d6860b9943a0c0970a108dfd5b9d357eb34073356693
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l17_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:128d8e4ea65ebedd56123097d4cc635dd0958840084b33625d06ec7b21e13355
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45b870d4485abfd0c57350e5b87eb4b215025c2d69a3e5620061aa7e3e1e871a
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l18_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f0e61614437be65baff7c20c430eb9fde34cf85f91ef8dc7a489715cf2ae70f
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa5072204d85a50f1115e3d8de609f33d9b9e792a4ea2a0c9e572b02b986242
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l19_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e92084c4a8117981ba9b7f5da0086c1bad38c4a7e8b87d4ba9193883f329b4b5
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07b011ce1b1c94dc2f03643d7fc086736f9ad76b9755081b43eb2b7532526e83
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l1_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2867a766cdba85a8e925d96d67757193be73e38267a653d8c78ebc7a3d1af5dd
3
- size 17508925
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd07df17677123fe11b3ede1409791c86b21f3ed6fb088fcf7e1981583172ee8
3
+ size 18243005
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l20_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c846e6bb008b448a4922297eed660f111780e3a0719f695100dec1564b4e23b2
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20648131068b6fd7be58699f6b34191ba7f6b0bf2b5622234e09fc1e713ca955
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l21_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc450fbd546cffe53250b9e74454faf9e452ec4412a11ec07e3b1857e7d64c70
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9806631129785f025cff5147abae93ae11b02fee39d987c4e3e387ff438e4238
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l22_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3595909c86c5706da8d49c9b87616d033ea1070b1ac08ab7802b63409fbeda99
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:473eccc3e07a4f3bcfe79a2fc55f17650472e09c2b22f3bd60d3700e30bb4340
3
+ size 18243013
fastvlm_C128_CTX1024_P640_ax650/llava_qwen2_p128_l23_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f91903d8a7313f1ce17cbc43cec71e4d72d0e358d893ce8da6f99b71622b641a
3
- size 17508933
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd4ad9014b4bda50eb37d7481871d6c1a0dadf3e677a52514d368f33d56b31f7
3
+ size 18243013