Update build_mlc_android.sh
Browse files- build_mlc_android.sh +3 -3
build_mlc_android.sh
CHANGED
@@ -20,7 +20,7 @@ MODEL_NAME="Qwen2-7B-Instruct-Tinytron-MLC"
|
|
20 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
21 |
|
22 |
# 生成配置
|
23 |
-
mlc_llm gen_config ${MODEL_PATH} --conv-template
|
24 |
|
25 |
# 切换模型
|
26 |
MODEL_PATH="Phi-2-Tinytron-preview"
|
@@ -29,7 +29,7 @@ MODEL_NAME="Phi-2-Tinytron-preview-MLC"
|
|
29 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
30 |
|
31 |
# 生成配置
|
32 |
-
mlc_llm gen_config ${MODEL_PATH} --conv-template
|
33 |
|
34 |
MODEL_PATH="Cauchy-3B-preview"
|
35 |
MODEL_NAME="Cauchy-3B-preview-MLC"
|
@@ -37,5 +37,5 @@ MODEL_NAME="Cauchy-3B-preview-MLC"
|
|
37 |
mlc_llm convert_weight --model-type cauchy --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
38 |
|
39 |
# 生成配置
|
40 |
-
mlc_llm gen_config ${MODEL_PATH} --model-type cauchy --conv-template
|
41 |
|
|
|
20 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
21 |
|
22 |
# 生成配置
|
23 |
+
mlc_llm gen_config ${MODEL_PATH} --conv-template qwen2 --quantization ${QUANTIZATION} --context-window-size 512 --prefill-chunk-size=16 --max-batch-size=1 -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
24 |
|
25 |
# 切换模型
|
26 |
MODEL_PATH="Phi-2-Tinytron-preview"
|
|
|
29 |
mlc_llm convert_weight --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
30 |
|
31 |
# 生成配置
|
32 |
+
mlc_llm gen_config ${MODEL_PATH} --conv-template qwen2 --quantization ${QUANTIZATION} --context-window-size 512 --prefill-chunk-size=16 --max-batch-size=1 -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
33 |
|
34 |
MODEL_PATH="Cauchy-3B-preview"
|
35 |
MODEL_NAME="Cauchy-3B-preview-MLC"
|
|
|
37 |
mlc_llm convert_weight --model-type cauchy --device cpu ${MODEL_PATH} --quantization ${QUANTIZATION} -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
38 |
|
39 |
# 生成配置
|
40 |
+
mlc_llm gen_config ${MODEL_PATH} --model-type cauchy --conv-template qwen2 --quantization ${QUANTIZATION} --context-window-size 512 --prefill-chunk-size=16 --max-batch-size=1 -o ${MODEL_OUTPUT_PATH}/${MODEL_NAME}/
|
41 |
|