# SmolLM2-360M-Instruct / run_smollm2_360m_ax630c.sh
# qqc1989's picture
# update the axmodel of ax630c
# be2089b verified
# Run the ./main_prefill binary from the current directory against the model
# files under smollm2-360m-ax630c/.
#
# Arguments:
#   $1 - prompt text, forwarded as --prompt. When omitted, an empty string is
#        forwarded instead.
#
# The prompt is captured first because the `set --` calls below overwrite the
# script's positional parameters while assembling the argument list.
user_prompt="$1"

# Model files addressed through a filename template containing %d, together
# with --axmodel_num 32.
# NOTE(review): presumably main_prefill substitutes an index for %d - confirm.
set -- \
  --template_filename_axmodel "smollm2-360m-ax630c/llama_p128_l%d_together.axmodel" \
  --axmodel_num 32

# Tokenizer settings. The tokenizer "model" is given as a localhost URL, so
# presumably a tokenizer service must already be listening on port 12345
# before this script is started - TODO confirm.
set -- "$@" \
  --tokenizer_type 2 \
  --filename_tokenizer_model "http://127.0.0.1:12345" \
  --bos 0 --eos 0

# Post model file.
set -- "$@" \
  --filename_post_axmodel "smollm2-360m-ax630c/llama_post.axmodel"

# Token embedding file plus its num/size parameters, with
# --use_mmap_load_embed set to 1.
set -- "$@" \
  --filename_tokens_embed "smollm2-360m-ax630c/model.embed_tokens.weight.bfloat16.bin" \
  --tokens_embed_num 49152 \
  --tokens_embed_size 960 \
  --use_mmap_load_embed 1

# Remaining runtime switches, followed by the prompt captured above.
set -- "$@" \
  --live_print 1 \
  --continue 1 \
  --prompt "$user_prompt"

# Last command of the block, so its exit status becomes the block's status.
./main_prefill "$@"