Qwen2.5-7B-Instruct-TensorParallel / run_qwen2.5_7B_axcl_context_tp.sh
zheqiushui's picture
Upload 38 files
50cd6d5 verified
# Launch ./main_tp_x86 (resolved relative to the current working directory)
# against the model files stored under qwen2.5_7b_tp/.
#
# Notes for reviewers:
#   - All file paths are relative, so the script must be started from the
#     directory that contains both main_tp_x86 and qwen2.5_7b_tp/.
#   - The "%d" in the axmodel template is passed through literally; presumably
#     the binary substitutes an index for each of the 28 axmodels
#     (--axmodel_num) -- TODO confirm.
#   - The tokenizer is addressed by URL on 127.0.0.1:12345; presumably a
#     tokenizer service has to be listening there beforehand -- TODO confirm.
#   - --devices receives the comma-separated list 0,1,2,3.
model_dir="qwen2.5_7b_tp"
tokenizer_url="http://127.0.0.1:12345"

./main_tp_x86 \
  --template_filename_axmodel "${model_dir}/qwen2_p128_l%d_together.tar" \
  --axmodel_num 28 \
  --tokenizer_type 2 \
  --url_tokenizer_model "${tokenizer_url}" \
  --filename_post_axmodel "${model_dir}/qwen2_post.tar" \
  --filename_tokens_embed "${model_dir}/model.embed_tokens.weight.bfloat16.bin" \
  --tokens_embed_num 152064 \
  --tokens_embed_size 3584 \
  --use_mmap_load_embed 1 \
  --live_print 1 \
  --devices 0,1,2,3