llmmlman committed on
Commit
435077c
·
verified ·
1 Parent(s): e8558a4

Update qnn/config.json

Browse files
Files changed (1) hide show
  1. qnn/config.json +8 -8
qnn/config.json CHANGED
@@ -23,7 +23,7 @@
23
  "cache_size": 3968,
24
  "context_size": 4096,
25
  "graph_name": "batch_1",
26
- "model_path": "llama3_1_8b_0.bin",
27
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
28
  "kv_size": 1,
29
  "x_name": "x",
@@ -37,7 +37,7 @@
37
  "cache_size": 3968,
38
  "context_size": 4096,
39
  "graph_name": "batch_1",
40
- "model_path": "llama3_1_8b_1.bin",
41
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
42
  "kv_size": 1,
43
  "x_name": "x",
@@ -51,7 +51,7 @@
51
  "cache_size": 3968,
52
  "context_size": 4096,
53
  "graph_name": "batch_1",
54
- "model_path": "llama3_1_8b_2.bin",
55
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
56
  "kv_size": 1,
57
  "x_name": "x",
@@ -65,7 +65,7 @@
65
  "cache_size": 3968,
66
  "context_size": 4096,
67
  "graph_name": "batch_1",
68
- "model_path": "llama3_1_8b_3.bin",
69
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
70
  "kv_size": 1,
71
  "x_name": "x",
@@ -79,7 +79,7 @@
79
  "cache_size": 3968,
80
  "context_size": 4096,
81
  "graph_name": "batch_128",
82
- "model_path": "llama3_1_8b_0.bin",
83
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
84
  "kv_size": 1,
85
  "x_name": "x",
@@ -93,7 +93,7 @@
93
  "cache_size": 3968,
94
  "context_size": 4096,
95
  "graph_name": "batch_128",
96
- "model_path": "llama3_1_8b_1.bin",
97
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
98
  "kv_size": 1,
99
  "x_name": "x",
@@ -107,7 +107,7 @@
107
  "cache_size": 3968,
108
  "context_size": 4096,
109
  "graph_name": "batch_128",
110
- "model_path": "llama3_1_8b_2.bin",
111
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
112
  "kv_size": 1,
113
  "x_name": "x",
@@ -121,7 +121,7 @@
121
  "cache_size": 3968,
122
  "context_size": 4096,
123
  "graph_name": "batch_128",
124
- "model_path": "llama3_1_8b_3.bin",
125
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
126
  "kv_size": 1,
127
  "x_name": "x",
 
23
  "cache_size": 3968,
24
  "context_size": 4096,
25
  "graph_name": "batch_1",
26
+ "model_path": "deepseek_r1_distill_llama_8b_0.bin",
27
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
28
  "kv_size": 1,
29
  "x_name": "x",
 
37
  "cache_size": 3968,
38
  "context_size": 4096,
39
  "graph_name": "batch_1",
40
+ "model_path": "deepseek_r1_distill_llama_8b_1.bin",
41
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
42
  "kv_size": 1,
43
  "x_name": "x",
 
51
  "cache_size": 3968,
52
  "context_size": 4096,
53
  "graph_name": "batch_1",
54
+ "model_path": "deepseek_r1_distill_llama_8b_2.bin",
55
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
56
  "kv_size": 1,
57
  "x_name": "x",
 
65
  "cache_size": 3968,
66
  "context_size": 4096,
67
  "graph_name": "batch_1",
68
+ "model_path": "deepseek_r1_distill_llama_8b_3.bin",
69
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
70
  "kv_size": 1,
71
  "x_name": "x",
 
79
  "cache_size": 3968,
80
  "context_size": 4096,
81
  "graph_name": "batch_128",
82
+ "model_path": "deepseek_r1_distill_llama_8b_0.bin",
83
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
84
  "kv_size": 1,
85
  "x_name": "x",
 
93
  "cache_size": 3968,
94
  "context_size": 4096,
95
  "graph_name": "batch_128",
96
+ "model_path": "deepseek_r1_distill_llama_8b_1.bin",
97
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
98
  "kv_size": 1,
99
  "x_name": "x",
 
107
  "cache_size": 3968,
108
  "context_size": 4096,
109
  "graph_name": "batch_128",
110
+ "model_path": "deepseek_r1_distill_llama_8b_2.bin",
111
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
112
  "kv_size": 1,
113
  "x_name": "x",
 
121
  "cache_size": 3968,
122
  "context_size": 4096,
123
  "graph_name": "batch_128",
124
+ "model_path": "deepseek_r1_distill_llama_8b_3.bin",
125
  "kv_path_format": "kv/layer_{layer_id}_{kv_type}_{head_id}.raw",
126
  "kv_size": 1,
127
  "x_name": "x",