# add run_qwen2.5_7b_ctx_int4_axcl_aarch64_api.sh (#1, opened by nickshek)
# File: run_qwen2.5_7b_ctx_int4_axcl_aarch64_api.sh (ADDED, @@ -0,0 +1,15 @@)
#
# Launches ./main_api_axcl_aarch64 with the model files found under
# qwen2.5-7b-ctx-int4-ax650/.
#
# All paths are relative, so run this script from the directory that contains
# both the main_api_axcl_aarch64 binary and the qwen2.5-7b-ctx-int4-ax650/
# directory.
#
# NOTE(review): --url_tokenizer_model points at http://0.0.0.0:12345;
# presumably a tokenizer service has to be listening there before this is
# started -- confirm against the binary's documentation.
# NOTE(review): "%d" in --template_filename_axmodel is passed through
# literally; it looks like the binary expands it per layer index (together
# with --axmodel_num 28) -- confirm.
#
# The command is a single logical line joined by trailing backslashes, so no
# comment or blank line may appear between its arguments.
./main_api_axcl_aarch64 \
--template_filename_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_p128_l%d_together.axmodel" \
--axmodel_num 28 \
--url_tokenizer_model "http://0.0.0.0:12345" \
--filename_post_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_post.axmodel" \
--filename_tokens_embed "qwen2.5-7b-ctx-int4-ax650/model.embed_tokens.weight.bfloat16.bin" \
--tokens_embed_num 152064 \
--tokens_embed_size 3584 \
--use_mmap_load_embed 1 \
--devices 0


# Optional flags left disabled by the author. To enable one, move it into the
# command above and make sure every line except the last ends with a
# backslash; a commented-out line cannot sit inside the continued command.
#--system_prompt "你的名字叫小智(allen),你是一个人畜无害的AI助手。深圳市今天(4月1日)阴天,愚人节,气温在14°C至19°C之间,微风。" \
#--kvcache_path "./kvcache" \
