Update build_mlc_android.sh
Browse files- build_mlc_android.sh +3 -3
build_mlc_android.sh
CHANGED
|
@@ -20,7 +20,7 @@ MODEL_NAME="Qwen2-7B-Instruct-Tinytron-MLC"
|
|
| 20 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 21 |
|
| 22 |
# 生成配置 (generate config)
|
| 23 |
-
mlc_llm gen_config ${MODEL_PATH} --conv-template
|
| 24 |
|
| 25 |
# 切换模型 (switch model)
|
| 26 |
MODEL_PATH="Phi-2-Tinytron-preview"
|
|
@@ -29,7 +29,7 @@ MODEL_NAME="Phi-2-Tinytron-preview-MLC"
|
|
| 29 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 30 |
|
| 31 |
# 生成配置 (generate config)
|
| 32 |
-
mlc_llm gen_config ${MODEL_PATH} --conv-template
|
| 33 |
|
| 34 |
MODEL_PATH="Cauchy-3B-preview"
|
| 35 |
MODEL_NAME="Cauchy-3B-preview-MLC"
|
|
@@ -37,5 +37,5 @@ MODEL_NAME="Cauchy-3B-preview-MLC"
|
|
| 37 |
mlc_llm convert_weight --model-type cauchy --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 38 |
|
| 39 |
# 生成配置 (generate config)
|
| 40 |
-
mlc_llm gen_config ${MODEL_PATH} --model-type cauchy --conv-template
|
| 41 |
|
|
|
|
| 20 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 21 |
|
| 22 |
# 生成配置 (generate config)
|
| 23 |
+
mlc_llm gen_config ${MODEL_PATH} --conv-template qwen2 --quantization ${QUANTIZATION} --context-window-size 512 --prefill-chunk-size=16 --max-batch-size=1 -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 24 |
|
| 25 |
# 切换模型 (switch model)
|
| 26 |
MODEL_PATH="Phi-2-Tinytron-preview"
|
|
|
|
| 29 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 30 |
|
| 31 |
# 生成配置 (generate config)
|
| 32 |
+
mlc_llm gen_config ${MODEL_PATH} --conv-template qwen2 --quantization ${QUANTIZATION} --context-window-size 512 --prefill-chunk-size=16 --max-batch-size=1 -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 33 |
|
| 34 |
MODEL_PATH="Cauchy-3B-preview"
|
| 35 |
MODEL_NAME="Cauchy-3B-preview-MLC"
|
|
|
|
| 37 |
mlc_llm convert_weight --model-type cauchy --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 38 |
|
| 39 |
# 生成配置 (generate config)
|
| 40 |
+
mlc_llm gen_config ${MODEL_PATH} --model-type cauchy --conv-template qwen2 --quantization ${QUANTIZATION} --context-window-size 512 --prefill-chunk-size=16 --max-batch-size=1 -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
| 41 |
|