diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..cb75bd41b572db1d6c5c37a021fa60db5bc82cf2 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +ggml/weights.gguf filter=lfs diff=lfs merge=lfs -text +vocab.gguf filter=lfs diff=lfs merge=lfs -text diff --git a/ggml/weights.gguf b/ggml/weights.gguf new file mode 100644 index 0000000000000000000000000000000000000000..235e7bb6e4b0afffb687aef5dd548cf8c8ee600c --- /dev/null +++ b/ggml/weights.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e2b762cb389efa5a3d42bf36d8ac827daf1e78e939fde463c05d26d86a2a048 +size 1742627744 diff --git a/model.json b/model.json new file mode 100644 index 0000000000000000000000000000000000000000..b6651ef21f5e184bfa45f3fca9dba74180b7bece --- /dev/null +++ b/model.json @@ -0,0 +1,27 @@ +{ + "model_id": "test", + "model_arch": "qwen2", + "version": 20241202, + "llm_config": { + "embed_dim": 2048, + "ffn_dim": 11008, + "head_size": 128, + "kv_dim": 256, + "n_attn_heads": 16, + "n_attn_kv_heads": 2, + "n_ctx": 32768, + "n_layers": 36, + "norm_eps": 9.999999974752427e-07, + "vocab_size": 151936, + "rope_config": { + "n_rope_ctx_orig": 32768, + "rope_attn_factor": 1.0, + "rope_dim": 128, + "rope_freq_base": 1000000.0, + "rope_freq_scale": 1.0, + "rope_scale_type": "linear", + "rope_type": -1 + } + }, + "vision": {} +} \ No newline at end of file diff --git a/qnn/config.json b/qnn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..3a6f21821873fc3405c8e66615aaf14ba9c9b72e --- /dev/null +++ b/qnn/config.json @@ -0,0 +1,91 @@ +{ + "model_parameters": { + "n_layers": 36, + "vocab_size": 151936, + "embed_dim": 2048, + "ffn_hidden_dim": 11008, + "head_dim": 128, + "n_kv_heads": 2, + "rope_theta": 1000000.0, + "rms_norm_eps": 1e-06, + "attention_mask_value": -50000.0, + "tie_embedding": true + }, + "qnn_parameters": { + "n_hvx_threads": 4 + }, + "graphs": [ + { + "type": "transformers", + "start_layer_id": 0, + "end_layer_id": 18, + "batch_size": 1, + "cache_size": 1920, + "context_size": 2048, + "graph_name": "batch_1", + "model_path": "qwen2.5_3b_0.bin", + "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw", + "kv_size": 11, + "x_name": "x", + "out_name": "out" + }, + { + "type": "transformers", + "start_layer_id": 18, + "end_layer_id": 36, + "batch_size": 1, + "cache_size": 1920, + "context_size": 2048, + "graph_name": "batch_1", + "model_path": "qwen2.5_3b_1.bin", + "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw", + "kv_size": 11, + "x_name": "x", + "out_name": "out" + }, + { + "type": "transformers", + "start_layer_id": 0, + "end_layer_id": 18, + "batch_size": 128, + "cache_size": 1920, + "context_size": 2048, + "graph_name": "batch_128", + "model_path": "qwen2.5_3b_0.bin", + "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw", + "kv_size": 11, + "x_name": "x", + "out_name": "out" + }, + { + "type": "transformers", + "start_layer_id": 18, + "end_layer_id": 36, + "batch_size": 128, + "cache_size": 1920, + "context_size": 2048, + "graph_name": "batch_128", + "model_path": "qwen2.5_3b_1.bin", + "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw", + "kv_size": 11, + "x_name": "x", + "out_name": "out" + } + ], + "embeddings": [ + { + "graph_name": "batch_1", + "model_path": "lm_head.bin", + "batch_size": 1, + "x_name": "x", + "out_name": "logits" + }, + { + "graph_name": "batch_128", + "model_path": "lm_head.bin", + "batch_size": 128, + "x_name": "x", + "out_name": "logits" + } + ] +} \ No newline at end of file diff --git a/qnn/kv/layer_0_key_0.raw b/qnn/kv/layer_0_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..e72b4e663f4b7c47ad3695458b7b3671a635dccd Binary files /dev/null and b/qnn/kv/layer_0_key_0.raw differ diff --git a/qnn/kv/layer_0_key_1.raw b/qnn/kv/layer_0_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..cc07efd42b7e85c19e61d52e19cbfd6562108ee4 Binary files /dev/null and b/qnn/kv/layer_0_key_1.raw differ diff --git a/qnn/kv/layer_0_value_0.raw b/qnn/kv/layer_0_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..b76a7d218ec25383146020abbcc5ed91b8505f69 Binary files /dev/null and b/qnn/kv/layer_0_value_0.raw differ diff --git a/qnn/kv/layer_0_value_1.raw b/qnn/kv/layer_0_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..498182ba5bd0f992441d611fd05ce871ba629064 Binary files /dev/null and b/qnn/kv/layer_0_value_1.raw differ diff --git a/qnn/kv/layer_10_key_0.raw b/qnn/kv/layer_10_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..4591d69ed0c2a9dc2c3fe17fb528664d94b7b40f Binary files /dev/null and b/qnn/kv/layer_10_key_0.raw differ diff --git a/qnn/kv/layer_10_key_1.raw b/qnn/kv/layer_10_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..648a089801e2f9eba27a0c4944b0a4b91fe83940 Binary files /dev/null and b/qnn/kv/layer_10_key_1.raw differ diff --git a/qnn/kv/layer_10_value_0.raw b/qnn/kv/layer_10_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..92f9b93237cb1403c7b2e1202ad3d59d90a1a4f8 Binary files /dev/null and b/qnn/kv/layer_10_value_0.raw differ diff --git a/qnn/kv/layer_10_value_1.raw b/qnn/kv/layer_10_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..229227f998c4d10a2efd529cf72c53fc65c6f6d1 Binary files /dev/null and b/qnn/kv/layer_10_value_1.raw differ diff --git a/qnn/kv/layer_11_key_0.raw b/qnn/kv/layer_11_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..b09d4f64d4ad994742f61c5256e2cea4f663ddc2 Binary files /dev/null and b/qnn/kv/layer_11_key_0.raw differ diff --git a/qnn/kv/layer_11_key_1.raw b/qnn/kv/layer_11_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..9b0df21840bcbe20e5ee3f6a34c72f35315414fb Binary files /dev/null and b/qnn/kv/layer_11_key_1.raw differ diff --git a/qnn/kv/layer_11_value_0.raw b/qnn/kv/layer_11_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..d0c91868fec7f10c1644b483ca828c0f8e176c47 Binary files /dev/null and b/qnn/kv/layer_11_value_0.raw differ diff --git a/qnn/kv/layer_11_value_1.raw b/qnn/kv/layer_11_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..0cc48806d57347bd17ce394e0c3e67da010134ee Binary files /dev/null and b/qnn/kv/layer_11_value_1.raw differ diff --git a/qnn/kv/layer_12_key_0.raw b/qnn/kv/layer_12_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..ea10e325d4b77decfbffe462b20b3f1fec8e9570 Binary files /dev/null and b/qnn/kv/layer_12_key_0.raw differ diff --git a/qnn/kv/layer_12_key_1.raw b/qnn/kv/layer_12_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..1ddcf2b2a4b4d581667102535618460b0a804a75 Binary files /dev/null and b/qnn/kv/layer_12_key_1.raw differ diff --git a/qnn/kv/layer_12_value_0.raw b/qnn/kv/layer_12_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..683a8dbfcb9d97fcde3d7842ffb9424fbfc8d306 Binary files /dev/null and b/qnn/kv/layer_12_value_0.raw differ diff --git a/qnn/kv/layer_12_value_1.raw b/qnn/kv/layer_12_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..bd460c02fab00480c5ce295c401d2c5ee3e0ded0 Binary files /dev/null and b/qnn/kv/layer_12_value_1.raw differ diff --git a/qnn/kv/layer_13_key_0.raw b/qnn/kv/layer_13_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..76b247ec72deba7fadabff9ac7fad355c4037252 Binary files /dev/null and b/qnn/kv/layer_13_key_0.raw differ diff --git a/qnn/kv/layer_13_key_1.raw b/qnn/kv/layer_13_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..0596c3915a8036e9f536d35735ea7a9dab2ff67a Binary files /dev/null and b/qnn/kv/layer_13_key_1.raw differ diff --git a/qnn/kv/layer_13_value_0.raw b/qnn/kv/layer_13_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..09de3fb76fcd0bed80a456760670934d3177917c Binary files /dev/null and b/qnn/kv/layer_13_value_0.raw differ diff --git a/qnn/kv/layer_13_value_1.raw b/qnn/kv/layer_13_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..8866f377013e431b4ac07ec027840122b23edaef Binary files /dev/null and b/qnn/kv/layer_13_value_1.raw differ diff --git a/qnn/kv/layer_14_key_0.raw b/qnn/kv/layer_14_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..dcaa91260bfafefa167122d63861d4866d2a062b Binary files /dev/null and b/qnn/kv/layer_14_key_0.raw differ diff --git a/qnn/kv/layer_14_key_1.raw b/qnn/kv/layer_14_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..a9318491e64e2920f1d6aa5286fd9e225b8f2ce2 Binary files /dev/null and b/qnn/kv/layer_14_key_1.raw differ diff --git a/qnn/kv/layer_14_value_0.raw b/qnn/kv/layer_14_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..d40c50319a75f1e0ce2b42f97ed3714325dd8c0a Binary files /dev/null and b/qnn/kv/layer_14_value_0.raw differ diff --git a/qnn/kv/layer_14_value_1.raw b/qnn/kv/layer_14_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..0a0ad76145f0e3a7bb7856e4cbb7d9145c508163 Binary files /dev/null and b/qnn/kv/layer_14_value_1.raw differ diff --git a/qnn/kv/layer_15_key_0.raw b/qnn/kv/layer_15_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..fb2a4ea9e4d1d631760f3e1780e6de291671aa05 Binary files /dev/null and b/qnn/kv/layer_15_key_0.raw differ diff --git a/qnn/kv/layer_15_key_1.raw b/qnn/kv/layer_15_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..ca374e80f68bdf405014d0830e5a86aa772ec444 Binary files /dev/null and b/qnn/kv/layer_15_key_1.raw differ diff --git a/qnn/kv/layer_15_value_0.raw b/qnn/kv/layer_15_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..6c9e280aacf1deac462a0842d1df270185f564e5 Binary files /dev/null and b/qnn/kv/layer_15_value_0.raw differ diff --git a/qnn/kv/layer_15_value_1.raw b/qnn/kv/layer_15_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..2734b2b5c8843cacc322e47e162a77b3d2b8f80d Binary files /dev/null and b/qnn/kv/layer_15_value_1.raw differ diff --git a/qnn/kv/layer_16_key_0.raw b/qnn/kv/layer_16_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..955f6f4ab0fcb81d0d4a18e2bad82ada8f7008a1 Binary files /dev/null and b/qnn/kv/layer_16_key_0.raw differ diff --git a/qnn/kv/layer_16_key_1.raw b/qnn/kv/layer_16_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..70152dd09e3e44ae44add637acf7ea71d21635b9 Binary files /dev/null and b/qnn/kv/layer_16_key_1.raw differ diff --git a/qnn/kv/layer_16_value_0.raw b/qnn/kv/layer_16_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..74d09a3fdbc591d52969549aeace52806b9703d8 Binary files /dev/null and b/qnn/kv/layer_16_value_0.raw differ diff --git a/qnn/kv/layer_16_value_1.raw b/qnn/kv/layer_16_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..eae0c72c18884f701177f5a7eee55108e2577178 Binary files /dev/null and b/qnn/kv/layer_16_value_1.raw differ diff --git a/qnn/kv/layer_17_key_0.raw b/qnn/kv/layer_17_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..adcce59b7c92838f9f44ab4121d6c5fa44546bcb Binary files /dev/null and b/qnn/kv/layer_17_key_0.raw differ diff --git a/qnn/kv/layer_17_key_1.raw b/qnn/kv/layer_17_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..263986712e1045607f8bed5a9bca64e8e119c171 Binary files /dev/null and b/qnn/kv/layer_17_key_1.raw differ diff --git a/qnn/kv/layer_17_value_0.raw b/qnn/kv/layer_17_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..48148cf36814171fb8a0daa03300994370b3461c Binary files /dev/null and b/qnn/kv/layer_17_value_0.raw differ diff --git a/qnn/kv/layer_17_value_1.raw b/qnn/kv/layer_17_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..7f3eb70125ca2279f6e1552cafdfee3755235c2c Binary files /dev/null and b/qnn/kv/layer_17_value_1.raw differ diff --git a/qnn/kv/layer_18_key_0.raw b/qnn/kv/layer_18_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..2fb85c8fda83ce50f06a1b0b0611dea507e82254 Binary files /dev/null and b/qnn/kv/layer_18_key_0.raw differ diff --git a/qnn/kv/layer_18_key_1.raw b/qnn/kv/layer_18_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..27ed9fa5ac66cfaa2ad9c4db750dc370c04d3bbd Binary files /dev/null and b/qnn/kv/layer_18_key_1.raw differ diff --git a/qnn/kv/layer_18_value_0.raw b/qnn/kv/layer_18_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..67f1e9a361721a8d547b8dbef81f44c38e0892b7 Binary files /dev/null and b/qnn/kv/layer_18_value_0.raw differ diff --git a/qnn/kv/layer_18_value_1.raw b/qnn/kv/layer_18_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..75b6524722449eeb81b8a4ccb741c5c8b5ace11b Binary files /dev/null and b/qnn/kv/layer_18_value_1.raw differ diff --git a/qnn/kv/layer_19_key_0.raw b/qnn/kv/layer_19_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..7666218b4d2a7593248fb58cef01ce25a9853cbf Binary files /dev/null and b/qnn/kv/layer_19_key_0.raw differ diff --git a/qnn/kv/layer_19_key_1.raw b/qnn/kv/layer_19_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..be1d9c847d6f8988d066d6be4cbfb9f6403d42ef Binary files /dev/null and b/qnn/kv/layer_19_key_1.raw differ diff --git a/qnn/kv/layer_19_value_0.raw b/qnn/kv/layer_19_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..0864a8e76ad848d110c21b80b5b8f44c1e2cad23 Binary files /dev/null and b/qnn/kv/layer_19_value_0.raw differ diff --git a/qnn/kv/layer_19_value_1.raw b/qnn/kv/layer_19_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..5eb7962b6bdb0aaa2c5930a0193362c1ab58b686 Binary files /dev/null and b/qnn/kv/layer_19_value_1.raw differ diff --git a/qnn/kv/layer_1_key_0.raw b/qnn/kv/layer_1_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..bca44d7259ffa891e2d14140b2427aca26d9f213 Binary files /dev/null and b/qnn/kv/layer_1_key_0.raw differ diff --git a/qnn/kv/layer_1_key_1.raw b/qnn/kv/layer_1_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..271e8ef366dd6b7342b53a127b28634d1d5c8bb9 Binary files /dev/null and b/qnn/kv/layer_1_key_1.raw differ diff --git a/qnn/kv/layer_1_value_0.raw b/qnn/kv/layer_1_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..198cc44701faba554ed7d43941a8a026fe1cbbb5 Binary files /dev/null and b/qnn/kv/layer_1_value_0.raw differ diff --git a/qnn/kv/layer_1_value_1.raw b/qnn/kv/layer_1_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..e080d5fcb4e4a319f83d9535dff20b4dd39b72f2 Binary files /dev/null and b/qnn/kv/layer_1_value_1.raw differ diff --git a/qnn/kv/layer_20_key_0.raw b/qnn/kv/layer_20_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..49c0485b7f87ebac6a9b7fbc08da16ce50929e95 Binary files /dev/null and b/qnn/kv/layer_20_key_0.raw differ diff --git a/qnn/kv/layer_20_key_1.raw b/qnn/kv/layer_20_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..249e3bca6adfc6d06110c87edc166a2f32736814 Binary files /dev/null and b/qnn/kv/layer_20_key_1.raw differ diff --git a/qnn/kv/layer_20_value_0.raw b/qnn/kv/layer_20_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..7f0de00827a45d924d58419d70397ae9d69b168f Binary files /dev/null and b/qnn/kv/layer_20_value_0.raw differ diff --git a/qnn/kv/layer_20_value_1.raw b/qnn/kv/layer_20_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..38a7f2be4bf968e733cd7beae0a2915b270adda3 Binary files /dev/null and b/qnn/kv/layer_20_value_1.raw differ diff --git a/qnn/kv/layer_21_key_0.raw b/qnn/kv/layer_21_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..439b65e12893a32a05420088a7549546567ebcc1 Binary files /dev/null and b/qnn/kv/layer_21_key_0.raw differ diff --git a/qnn/kv/layer_21_key_1.raw b/qnn/kv/layer_21_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..b8a9bd08ae617a290c08c74c70074191121c876a Binary files /dev/null and b/qnn/kv/layer_21_key_1.raw differ diff --git a/qnn/kv/layer_21_value_0.raw b/qnn/kv/layer_21_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..6259fa425aa2c3a82b44d98a81b8d55c4b626732 Binary files /dev/null and b/qnn/kv/layer_21_value_0.raw differ diff --git a/qnn/kv/layer_21_value_1.raw b/qnn/kv/layer_21_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..6053d201c8d57ab23c49b70bf75ef3142a365a3a Binary files /dev/null and b/qnn/kv/layer_21_value_1.raw differ diff --git a/qnn/kv/layer_22_key_0.raw b/qnn/kv/layer_22_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..6f9201e7cbce8c94eaa39197c757065a8f0ede81 Binary files /dev/null and b/qnn/kv/layer_22_key_0.raw differ diff --git a/qnn/kv/layer_22_key_1.raw b/qnn/kv/layer_22_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..a3a684131e8a1e554bfd83ba958a5d78bb914098 Binary files /dev/null and b/qnn/kv/layer_22_key_1.raw differ diff --git a/qnn/kv/layer_22_value_0.raw b/qnn/kv/layer_22_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..f0ab850c5090eee9dadf888eaa1f26f23a27dd8e Binary files /dev/null and b/qnn/kv/layer_22_value_0.raw differ diff --git a/qnn/kv/layer_22_value_1.raw b/qnn/kv/layer_22_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..3d2d0d62441a72ebae407f29ae82954b1772134b Binary files /dev/null and b/qnn/kv/layer_22_value_1.raw differ diff --git a/qnn/kv/layer_23_key_0.raw b/qnn/kv/layer_23_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..5a7dab57033f1df32e11d6d202148099b3cc0540 Binary files /dev/null and b/qnn/kv/layer_23_key_0.raw differ diff --git a/qnn/kv/layer_23_key_1.raw b/qnn/kv/layer_23_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..a47218d545ea7625c999c606f02ed9d6b430beaa Binary files /dev/null and b/qnn/kv/layer_23_key_1.raw differ diff --git a/qnn/kv/layer_23_value_0.raw b/qnn/kv/layer_23_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..4f1feb17705cf6de00b9060fc1c99915f4270727 Binary files /dev/null and b/qnn/kv/layer_23_value_0.raw differ diff --git a/qnn/kv/layer_23_value_1.raw b/qnn/kv/layer_23_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..518628ae22542ca3760f417072c944d95ac87edc Binary files /dev/null and b/qnn/kv/layer_23_value_1.raw differ diff --git a/qnn/kv/layer_24_key_0.raw b/qnn/kv/layer_24_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..4e8a334c3ab1f957afc4ddb28545deb7375457b3 Binary files /dev/null and b/qnn/kv/layer_24_key_0.raw differ diff --git a/qnn/kv/layer_24_key_1.raw b/qnn/kv/layer_24_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..15fa92bf62c5af354671f177c437bd4fbb1d9057 Binary files /dev/null and b/qnn/kv/layer_24_key_1.raw differ diff --git a/qnn/kv/layer_24_value_0.raw b/qnn/kv/layer_24_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..53f171695c7672cf2c9d93bf28ebb6450992233c Binary files /dev/null and b/qnn/kv/layer_24_value_0.raw differ diff --git a/qnn/kv/layer_24_value_1.raw b/qnn/kv/layer_24_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..630f0a59b44202a594a417dcec621ce7a3b530bd Binary files /dev/null and b/qnn/kv/layer_24_value_1.raw differ diff --git a/qnn/kv/layer_25_key_0.raw b/qnn/kv/layer_25_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..06e2b2335eb6a2f795e76f371342bd2b3da2cd40 Binary files /dev/null and b/qnn/kv/layer_25_key_0.raw differ diff --git a/qnn/kv/layer_25_key_1.raw b/qnn/kv/layer_25_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..2cf675c6d9ea85c154a0c1012efb7ab4a01eaadf Binary files /dev/null and b/qnn/kv/layer_25_key_1.raw differ diff --git a/qnn/kv/layer_25_value_0.raw b/qnn/kv/layer_25_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..5485a8fb94413c2ccf3b6677cefa3c3ae9a5809f Binary files /dev/null and b/qnn/kv/layer_25_value_0.raw differ diff --git a/qnn/kv/layer_25_value_1.raw b/qnn/kv/layer_25_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..d20f3b7ec386cbade000572678d2c14db63dc579 Binary files /dev/null and b/qnn/kv/layer_25_value_1.raw differ diff --git a/qnn/kv/layer_26_key_0.raw b/qnn/kv/layer_26_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..b2462b3ddb66115f3ab128b1bb118b36aae91690 Binary files /dev/null and b/qnn/kv/layer_26_key_0.raw differ diff --git a/qnn/kv/layer_26_key_1.raw b/qnn/kv/layer_26_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..a4023832cbd22873c0a53dc798a23740f523cce4 Binary files /dev/null and b/qnn/kv/layer_26_key_1.raw differ diff --git a/qnn/kv/layer_26_value_0.raw b/qnn/kv/layer_26_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..4348ff2bc7f465c4374aa2f0cd38784d7343aedb Binary files /dev/null and b/qnn/kv/layer_26_value_0.raw differ diff --git a/qnn/kv/layer_26_value_1.raw b/qnn/kv/layer_26_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..84032a08783d21ada635dd0aa0c0d32da45eeb5f Binary files /dev/null and b/qnn/kv/layer_26_value_1.raw differ diff --git a/qnn/kv/layer_27_key_0.raw b/qnn/kv/layer_27_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..f955cf10c2fd8c5b3ad1bc38f07d2acf59815419 Binary files /dev/null and b/qnn/kv/layer_27_key_0.raw differ diff --git a/qnn/kv/layer_27_key_1.raw b/qnn/kv/layer_27_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..82a9095d9fb9d36e0a74f66d22d6f3bafeb56974 Binary files /dev/null and b/qnn/kv/layer_27_key_1.raw differ diff --git a/qnn/kv/layer_27_value_0.raw b/qnn/kv/layer_27_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..35c6c09d7514e433077cceb5f87a0f53d529048b Binary files /dev/null and b/qnn/kv/layer_27_value_0.raw differ diff --git a/qnn/kv/layer_27_value_1.raw b/qnn/kv/layer_27_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..8c1fbe02217ee728ee7a0b4134566a7a6b5008ae Binary files /dev/null and b/qnn/kv/layer_27_value_1.raw differ diff --git a/qnn/kv/layer_28_key_0.raw b/qnn/kv/layer_28_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..86eb694b82901a21376c0ed5128b6585c8294d65 Binary files /dev/null and b/qnn/kv/layer_28_key_0.raw differ diff --git a/qnn/kv/layer_28_key_1.raw b/qnn/kv/layer_28_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..a6a2e06b389d5e90d724c246db2b0383c4e6b959 Binary files /dev/null and b/qnn/kv/layer_28_key_1.raw differ diff --git a/qnn/kv/layer_28_value_0.raw b/qnn/kv/layer_28_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..bb1b5e614821e14100ef0c01d9f8f838fdb682fc Binary files /dev/null and b/qnn/kv/layer_28_value_0.raw differ diff --git a/qnn/kv/layer_28_value_1.raw b/qnn/kv/layer_28_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..573c43020232e092026e9c686decc85e0524156c Binary files /dev/null and b/qnn/kv/layer_28_value_1.raw differ diff --git a/qnn/kv/layer_29_key_0.raw b/qnn/kv/layer_29_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..4817f63dcedd5b69e0177470d663feb903eb04a8 Binary files /dev/null and b/qnn/kv/layer_29_key_0.raw differ diff --git a/qnn/kv/layer_29_key_1.raw b/qnn/kv/layer_29_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..f76963e22f212f3444570b23a528e96da82a9a12 Binary files /dev/null and b/qnn/kv/layer_29_key_1.raw differ diff --git a/qnn/kv/layer_29_value_0.raw b/qnn/kv/layer_29_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..a7594807f7c0b20736a615857189d59049cb968c Binary files /dev/null and b/qnn/kv/layer_29_value_0.raw differ diff --git a/qnn/kv/layer_29_value_1.raw b/qnn/kv/layer_29_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..6edd97df83be6f922bce73174f6df9c945bd5fff Binary files /dev/null and b/qnn/kv/layer_29_value_1.raw differ diff --git a/qnn/kv/layer_2_key_0.raw b/qnn/kv/layer_2_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..ab1794c68c673450c57b903f2afc39704092a0bb Binary files /dev/null and b/qnn/kv/layer_2_key_0.raw differ diff --git a/qnn/kv/layer_2_key_1.raw b/qnn/kv/layer_2_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..d79244cadc121b2b43c752f4e7f57163dac4ec3c Binary files /dev/null and b/qnn/kv/layer_2_key_1.raw differ diff --git a/qnn/kv/layer_2_value_0.raw b/qnn/kv/layer_2_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..a1b7e0424f5333d86223d7e1e15e3ca2633be5ba Binary files /dev/null and b/qnn/kv/layer_2_value_0.raw differ diff --git a/qnn/kv/layer_2_value_1.raw b/qnn/kv/layer_2_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..99c53b312e3adf20abf601610ee695358ce9ecde Binary files /dev/null and b/qnn/kv/layer_2_value_1.raw differ diff --git a/qnn/kv/layer_30_key_0.raw b/qnn/kv/layer_30_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..7c634a2027b9d43b54d2b5ab937aca2e180088fc Binary files /dev/null and b/qnn/kv/layer_30_key_0.raw differ diff --git a/qnn/kv/layer_30_key_1.raw b/qnn/kv/layer_30_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..e6499f292368bb7e1f44dd1045359dfffb9b7197 Binary files /dev/null and b/qnn/kv/layer_30_key_1.raw differ diff --git a/qnn/kv/layer_30_value_0.raw b/qnn/kv/layer_30_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..b5de1e6b5c8bfc4e1b2d2737596dd95de9b0f3d3 Binary files /dev/null and b/qnn/kv/layer_30_value_0.raw differ diff --git a/qnn/kv/layer_30_value_1.raw b/qnn/kv/layer_30_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..2a86bd351b7f44ed4fb4bb40bf459fd1bae9cdb7 Binary files /dev/null and b/qnn/kv/layer_30_value_1.raw differ diff --git a/qnn/kv/layer_31_key_0.raw b/qnn/kv/layer_31_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..c04b2b13f8103df7b680e819702110193171a4f9 Binary files /dev/null and b/qnn/kv/layer_31_key_0.raw differ diff --git a/qnn/kv/layer_31_key_1.raw b/qnn/kv/layer_31_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..d740010596f2e0c3dc8722ad6a3f06cbfe3892aa Binary files /dev/null and b/qnn/kv/layer_31_key_1.raw differ diff --git a/qnn/kv/layer_31_value_0.raw b/qnn/kv/layer_31_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..de470e10e3ab18b64fee65454d099bc6191ee5bb Binary files /dev/null and b/qnn/kv/layer_31_value_0.raw differ diff --git a/qnn/kv/layer_31_value_1.raw b/qnn/kv/layer_31_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..03d11520e99fad459e7a7ca867bd8292aa32d81e Binary files /dev/null and b/qnn/kv/layer_31_value_1.raw differ diff --git a/qnn/kv/layer_32_key_0.raw b/qnn/kv/layer_32_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..27133e80dd1d1feb91f0f893cd8047e3f8cb35bb Binary files /dev/null and b/qnn/kv/layer_32_key_0.raw differ diff --git a/qnn/kv/layer_32_key_1.raw b/qnn/kv/layer_32_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..e41936a039aaf946ad95da437ee4adb0b11fe3bc Binary files /dev/null and b/qnn/kv/layer_32_key_1.raw differ diff --git a/qnn/kv/layer_32_value_0.raw b/qnn/kv/layer_32_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..e2d589fe16b6e812ebad151225da47bf232f8720 Binary files /dev/null and b/qnn/kv/layer_32_value_0.raw differ diff --git a/qnn/kv/layer_32_value_1.raw b/qnn/kv/layer_32_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..bef5c6e529f8410b17fe4b5adac8fdf7598ca9db Binary files /dev/null and b/qnn/kv/layer_32_value_1.raw differ diff --git a/qnn/kv/layer_33_key_0.raw b/qnn/kv/layer_33_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..28b351a9782926c1b078514a6fab77afb3e7a942 Binary files /dev/null and b/qnn/kv/layer_33_key_0.raw differ diff --git a/qnn/kv/layer_33_key_1.raw b/qnn/kv/layer_33_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..20dd05cabd7d6cb666f7fa5599585edd805b1bb0 Binary files /dev/null and b/qnn/kv/layer_33_key_1.raw differ diff --git a/qnn/kv/layer_33_value_0.raw b/qnn/kv/layer_33_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..eb0b7fa24049588ec557c65302aea8b58968190f Binary files /dev/null and b/qnn/kv/layer_33_value_0.raw differ diff --git a/qnn/kv/layer_33_value_1.raw b/qnn/kv/layer_33_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..eb2651894875b29a574e6a5f04669f0923a63d0a Binary files /dev/null and b/qnn/kv/layer_33_value_1.raw differ diff --git a/qnn/kv/layer_34_key_0.raw b/qnn/kv/layer_34_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..994748f838337cb8b333e0f01f0c59229dee37d5 Binary files /dev/null and b/qnn/kv/layer_34_key_0.raw differ diff --git a/qnn/kv/layer_34_key_1.raw b/qnn/kv/layer_34_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..17d4a3d260f3a04c188e83fcd5367f42a6622ae9 Binary files /dev/null and b/qnn/kv/layer_34_key_1.raw differ diff --git a/qnn/kv/layer_34_value_0.raw b/qnn/kv/layer_34_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..f95a07b49be06847d053ce3eeecfe70dc7e882b1 Binary files /dev/null and b/qnn/kv/layer_34_value_0.raw differ diff --git a/qnn/kv/layer_34_value_1.raw b/qnn/kv/layer_34_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..c1ec15385f0a683e845be3dc7cb75e720f815f4f Binary files /dev/null and b/qnn/kv/layer_34_value_1.raw differ diff --git a/qnn/kv/layer_35_key_0.raw b/qnn/kv/layer_35_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..09ff773db42b360c2f786d880bf020a134d3685b Binary files /dev/null and b/qnn/kv/layer_35_key_0.raw differ diff --git a/qnn/kv/layer_35_key_1.raw b/qnn/kv/layer_35_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..b6dbe3d675ad6be97ae0bc3ef1d04d50146b99d3 Binary files /dev/null and b/qnn/kv/layer_35_key_1.raw differ diff --git a/qnn/kv/layer_35_value_0.raw b/qnn/kv/layer_35_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..5aad74d3520607ea6a7fab0c9d7ac723b696ff48 Binary files /dev/null and b/qnn/kv/layer_35_value_0.raw differ diff --git a/qnn/kv/layer_35_value_1.raw b/qnn/kv/layer_35_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..7cc7bd58e11bc6ca2723c393071d63f4b133020d Binary files /dev/null and b/qnn/kv/layer_35_value_1.raw differ diff --git a/qnn/kv/layer_3_key_0.raw b/qnn/kv/layer_3_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..65e5e0dbc67cfe4bfb1f0ff3f4305855ecf67dc2 Binary files /dev/null and b/qnn/kv/layer_3_key_0.raw differ diff --git a/qnn/kv/layer_3_key_1.raw b/qnn/kv/layer_3_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..049ff0d6eae86784362a203609f280b40f1a14f2 Binary files /dev/null and b/qnn/kv/layer_3_key_1.raw differ diff --git a/qnn/kv/layer_3_value_0.raw b/qnn/kv/layer_3_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..e20022af7127a004a649ab54765d7f84e861b2e4 Binary files /dev/null and b/qnn/kv/layer_3_value_0.raw differ diff --git a/qnn/kv/layer_3_value_1.raw b/qnn/kv/layer_3_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..4dfd7cf2ff67d7c0c5a6119dd9cffc183ed395c5 Binary files /dev/null and b/qnn/kv/layer_3_value_1.raw differ diff --git a/qnn/kv/layer_4_key_0.raw b/qnn/kv/layer_4_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..aa9559b0570326577c569e3ba14a9b25a2c23b75 Binary files /dev/null and b/qnn/kv/layer_4_key_0.raw differ diff --git a/qnn/kv/layer_4_key_1.raw b/qnn/kv/layer_4_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..70427ab865cc84c12e45465095fd7c246b81d169 Binary files /dev/null and b/qnn/kv/layer_4_key_1.raw differ diff --git a/qnn/kv/layer_4_value_0.raw b/qnn/kv/layer_4_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..b7d9fc9a74ff905b5fe41295cfed372055b315a4 Binary files /dev/null and b/qnn/kv/layer_4_value_0.raw differ diff --git a/qnn/kv/layer_4_value_1.raw b/qnn/kv/layer_4_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..569702972228d2ce353e90a74d413725ea3215f1 Binary files /dev/null and b/qnn/kv/layer_4_value_1.raw differ diff --git a/qnn/kv/layer_5_key_0.raw b/qnn/kv/layer_5_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..bd6877fe5aa36e954a06c5f0ec34b85e42d3775d Binary files /dev/null and b/qnn/kv/layer_5_key_0.raw differ diff --git a/qnn/kv/layer_5_key_1.raw b/qnn/kv/layer_5_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..ff384cc7017914619b1ab7c7dcdc59908ff63ed2 Binary files /dev/null and b/qnn/kv/layer_5_key_1.raw differ diff --git a/qnn/kv/layer_5_value_0.raw b/qnn/kv/layer_5_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..25c41a4ef43702f9bee1029e95d6a57b0d01123a Binary files /dev/null and b/qnn/kv/layer_5_value_0.raw differ diff --git a/qnn/kv/layer_5_value_1.raw b/qnn/kv/layer_5_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..e5479ba4e096c5ccc321cc05abec18cfdd6004aa Binary files /dev/null and b/qnn/kv/layer_5_value_1.raw differ diff --git a/qnn/kv/layer_6_key_0.raw b/qnn/kv/layer_6_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..706fa090156a8265dcfe1bee91e0eff63fc6c724 Binary files /dev/null and b/qnn/kv/layer_6_key_0.raw differ diff --git a/qnn/kv/layer_6_key_1.raw b/qnn/kv/layer_6_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..0469ae69a21b775707ddd2471668f2fd2e7c84a1 Binary files /dev/null and b/qnn/kv/layer_6_key_1.raw differ diff --git a/qnn/kv/layer_6_value_0.raw b/qnn/kv/layer_6_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..7cd962347babf6612555f1870cd675dbd28c0d3a Binary files /dev/null and b/qnn/kv/layer_6_value_0.raw differ diff --git a/qnn/kv/layer_6_value_1.raw b/qnn/kv/layer_6_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..f99d7517fece99742209f5d6d15a2e3b6ee889b4 Binary files /dev/null and b/qnn/kv/layer_6_value_1.raw differ diff --git a/qnn/kv/layer_7_key_0.raw b/qnn/kv/layer_7_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..8d9e8f2d105d76407fe19b5466537cb8f6d48c42 Binary files /dev/null and b/qnn/kv/layer_7_key_0.raw differ diff --git a/qnn/kv/layer_7_key_1.raw b/qnn/kv/layer_7_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..f008eda7599fd4ac2c21721d81213d29ed921ce1 Binary files /dev/null and b/qnn/kv/layer_7_key_1.raw differ diff --git a/qnn/kv/layer_7_value_0.raw b/qnn/kv/layer_7_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..79fdf8c1d2d474f3930dd22cc4461ab783a219bd Binary files /dev/null and b/qnn/kv/layer_7_value_0.raw differ diff --git a/qnn/kv/layer_7_value_1.raw b/qnn/kv/layer_7_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..9a2012e80375d21d04801cd3fed796ad148aa117 Binary files /dev/null and b/qnn/kv/layer_7_value_1.raw differ diff --git a/qnn/kv/layer_8_key_0.raw b/qnn/kv/layer_8_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..029e282b1273d87b2980ffae3f3e6872fdd7e47f Binary files /dev/null and b/qnn/kv/layer_8_key_0.raw differ diff --git a/qnn/kv/layer_8_key_1.raw b/qnn/kv/layer_8_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..c809f6d069e8d61c33344beb2ec5be6bf8ce58ae Binary files /dev/null and b/qnn/kv/layer_8_key_1.raw differ diff --git a/qnn/kv/layer_8_value_0.raw b/qnn/kv/layer_8_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..eacf4aa9cb1f75b76229ee0cf65f8c29df29d98c Binary files /dev/null and b/qnn/kv/layer_8_value_0.raw differ diff --git a/qnn/kv/layer_8_value_1.raw b/qnn/kv/layer_8_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..31956c3a687068e61f8958e201324d6d522f5d1a Binary files /dev/null and b/qnn/kv/layer_8_value_1.raw differ diff --git a/qnn/kv/layer_9_key_0.raw b/qnn/kv/layer_9_key_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..2518e18621f790235dcef98aaf0db76334820df9 Binary files /dev/null and b/qnn/kv/layer_9_key_0.raw differ diff --git a/qnn/kv/layer_9_key_1.raw b/qnn/kv/layer_9_key_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..46a0078d47882d72ccc7df9b286e5a2a18e568b0 Binary files /dev/null and b/qnn/kv/layer_9_key_1.raw differ diff --git a/qnn/kv/layer_9_value_0.raw b/qnn/kv/layer_9_value_0.raw new file mode 100644 index 0000000000000000000000000000000000000000..f36ee9593190b1e88c2e18fc5f3a23bfb531ffaf Binary files /dev/null and b/qnn/kv/layer_9_value_0.raw differ diff --git a/qnn/kv/layer_9_value_1.raw b/qnn/kv/layer_9_value_1.raw new file mode 100644 index 0000000000000000000000000000000000000000..a907642bad1bbdc2bc190fa358f8a1bd7eb5f6f3 Binary files /dev/null and b/qnn/kv/layer_9_value_1.raw differ diff --git a/qnn/lm_head.bin b/qnn/lm_head.bin new file mode 100644 index 0000000000000000000000000000000000000000..ece6358f8967eaa9ab8fad48226ab79731428fa8 --- /dev/null +++ b/qnn/lm_head.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05631eb647ccbdfe017624c0322f66923ea8051e52b5b53bb76ff1538eefe7a0 +size 163965312 diff --git a/qnn/qwen2.5_3b_0.bin b/qnn/qwen2.5_3b_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d635a3c5bf11ce8a153e81d5a875446ce6b5893 --- /dev/null +++ b/qnn/qwen2.5_3b_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd4c34eac9291e59553fb86dd9f44795ee4c21331244f629ef416234e42c116 +size 1074006168 diff --git a/qnn/qwen2.5_3b_1.bin b/qnn/qwen2.5_3b_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d757234cfc8ce76a088b15ac5af844d206df3ec --- /dev/null +++ b/qnn/qwen2.5_3b_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4becd6dd91e7cb0c6618fa94d66aed26c6b1c479302f56a1fcc23411a39803 +size 1098870184 diff --git a/vocab.gguf b/vocab.gguf new file mode 100644 index 0000000000000000000000000000000000000000..2cc819bb07f0f8ccd76c510cead0b5d3f837b564 --- /dev/null +++ b/vocab.gguf @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f548d3c24e1883f889ce32a4d566e37f91fc38947b2c451469676fecc2865226 +size 5929071