File size: 630 Bytes
d8727b9
 
 
 
 
 
 
 
 
 
 
 
 
2aca529
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# Launch ./main_ax650 (resolved relative to the current directory) with the
# Qwen2.5-0.5B GPTQ-int8 model files. All model paths below are relative, so
# run this script from the directory that contains the model folder.
model_dir="qwen2.5-0.5b-gptq-int8-ctx-ax630c"

# Build the argument list in the positional parameters, one option at a time,
# so each option can be commented; "$@" passes them on word-for-word.
# Any arguments given to this script itself are discarded here (the script
# never forwarded them).
set -- --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant."

# Per-layer model files; %d is left literal for the binary to fill in.
# NOTE(review): 24 presumably equals the number of files the template
# expands to - confirm against the model directory.
set -- "$@" --template_filename_axmodel "${model_dir}/qwen2_p128_l%d_together.axmodel"
set -- "$@" --axmodel_num 24

# Tokenizer endpoint on localhost; presumably a tokenizer service must already
# be listening on this port before the binary starts - verify.
set -- "$@" --url_tokenizer_model "http://127.0.0.1:12345"

set -- "$@" --filename_post_axmodel "${model_dir}/qwen2_post.axmodel"

# Embedding table and its dimensions.
# NOTE(review): 151936 x 896 looks like vocabulary size x embedding width -
# confirm these match the .bin file.
set -- "$@" --filename_tokens_embed "${model_dir}/model.embed_tokens.weight.bfloat16.bin"
set -- "$@" --tokens_embed_num 151936
set -- "$@" --tokens_embed_size 896

# Runtime switches, passed through exactly as given (0 = off, 1 = on by name).
set -- "$@" --use_mmap_load_embed 0
set -- "$@" --live_print 1

./main_ax650 "$@"

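# Optional flags, currently disabled. To enable one, pass it to ./main_ax650
# above as an additional argument:
#   --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi   (machine-specific path; adjust)
#   --tokenizer_type 2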