wli1995 committed on
Commit
21677d1
·
verified ·
1 Parent(s): 60bc88e

Upload folder using huggingface_hub

Browse files
main_api_ax650 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53024db31c1fe910d5b13f3e31daf903bfde87ee18d29d49a4094aadb883517f
3
- size 1064648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e800cd6e00dd2ad7303cb6fb6b867a33704665bded213fe4bd3be3df025c0821
3
+ size 1064760
main_ax650 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:622b8f33f3d6e9caf0b5aac480a5327d5f92b419d717b7403cb72807fa1e3fc7
3
- size 985248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19ddeb193769b16aa8c5d9bba887558aa0a4ed10eb50a19d9bc117f1ba527e5
3
+ size 985352
run_qwen2.5_7b_ctx_ax650.sh CHANGED
@@ -1,9 +1,9 @@
1
  ./main_ax650 \
2
- --template_filename_axmodel "qwen2.5-7b-ctx-ax650/qwen2_p128_l%d_together.axmodel" \
3
  --axmodel_num 28 \
4
  --url_tokenizer_model "http://0.0.0.0:12345" \
5
- --filename_post_axmodel "qwen2.5-7b-ctx-ax650/qwen2_post.axmodel" \
6
- --filename_tokens_embed "qwen2.5-7b-ctx-ax650/model.embed_tokens.weight.bfloat16.bin" \
7
  --tokens_embed_num 152064 \
8
  --tokens_embed_size 3584 \
9
  --use_mmap_load_embed 1 \
 
1
  ./main_ax650 \
2
+ --template_filename_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_p128_l%d_together.axmodel" \
3
  --axmodel_num 28 \
4
  --url_tokenizer_model "http://0.0.0.0:12345" \
5
+ --filename_post_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_post.axmodel" \
6
+ --filename_tokens_embed "qwen2.5-7b-ctx-int4-ax650/model.embed_tokens.weight.bfloat16.bin" \
7
  --tokens_embed_num 152064 \
8
  --tokens_embed_size 3584 \
9
  --use_mmap_load_embed 1 \
run_qwen2.5_7b_ctx_int4_ax650.sh CHANGED
@@ -1,5 +1,6 @@
1
  ./main_ax650 \
2
  --template_filename_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_p128_l%d_together.axmodel" \
 
3
  --url_tokenizer_model "http://0.0.0.0:12345" \
4
  --filename_post_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_post.axmodel" \
5
  --filename_tokens_embed "qwen2.5-7b-ctx-int4-ax650/model.embed_tokens.weight.bfloat16.bin" \
 
1
  ./main_ax650 \
2
  --template_filename_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_p128_l%d_together.axmodel" \
3
+ --axmodel_num 28 \
4
  --url_tokenizer_model "http://0.0.0.0:12345" \
5
  --filename_post_axmodel "qwen2.5-7b-ctx-int4-ax650/qwen2_post.axmodel" \
6
  --filename_tokens_embed "qwen2.5-7b-ctx-int4-ax650/model.embed_tokens.weight.bfloat16.bin" \