iproskurina commited on
Commit
f60ab19
·
verified ·
1 Parent(s): cbf0a4a

Add files using upload-large-folder tool

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. quant_log.csv +196 -196
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00f7c4d9a1f659366f65d5fb99ca7b6f2da6da0d6b74ae8128d4249cde3aae08
3
  size 2255767328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c39cf80182cd44a4517c067951857427c1013ff5da1029b810f755bf0c19a530
3
  size 2255767328
quant_log.csv CHANGED
@@ -1,197 +1,197 @@
1
  layer,module,loss,samples,damp,time
2
- 0,self_attn.k_proj,0.30112195,0.01000,1.150
3
- 0,self_attn.v_proj,0.01570884,0.01000,1.133
4
- 0,self_attn.q_proj,0.59113240,0.01000,1.155
5
- 0,self_attn.o_proj,0.00065421,0.01000,1.159
6
- 0,mlp.up_proj,0.37343988,0.01000,1.144
7
- 0,mlp.gate_proj,0.42701188,0.01000,1.160
8
- 0,mlp.down_proj,0.00581118,0.01000,3.120
9
- 1,self_attn.k_proj,0.38888621,0.01000,1.147
10
- 1,self_attn.v_proj,0.04474297,0.01000,1.126
11
- 1,self_attn.q_proj,0.66478097,0.01000,1.175
12
- 1,self_attn.o_proj,0.00249097,0.01000,1.147
13
- 1,mlp.up_proj,0.52243674,0.01000,1.149
14
- 1,mlp.gate_proj,0.59576809,0.01000,1.154
15
- 1,mlp.down_proj,0.06515677,0.01000,3.167
16
- 2,self_attn.k_proj,1.88801134,0.01000,1.123
17
- 2,self_attn.v_proj,0.19233426,0.01000,1.127
18
- 2,self_attn.q_proj,3.18083096,0.01000,1.152
19
- 2,self_attn.o_proj,0.00320804,0.01000,1.135
20
- 2,mlp.up_proj,0.82030928,0.01000,1.164
21
- 2,mlp.gate_proj,0.96838230,0.01000,1.149
22
- 2,mlp.down_proj,0.01880076,0.01000,3.121
23
- 3,self_attn.k_proj,1.22175431,0.01000,1.168
24
- 3,self_attn.v_proj,0.21496563,0.01000,1.144
25
- 3,self_attn.q_proj,2.22663021,0.01000,1.159
26
- 3,self_attn.o_proj,0.00706171,0.01000,1.162
27
- 3,mlp.up_proj,1.06836176,0.01000,1.169
28
- 3,mlp.gate_proj,1.42266273,0.01000,1.178
29
- 3,mlp.down_proj,0.02924869,0.01000,3.214
30
- 4,self_attn.k_proj,1.15004706,0.01000,1.127
31
- 4,self_attn.v_proj,0.22012554,0.01000,1.155
32
- 4,self_attn.q_proj,2.19098425,0.01000,1.161
33
- 4,self_attn.o_proj,0.01024623,0.01000,1.158
34
- 4,mlp.up_proj,1.26271689,0.01000,1.149
35
- 4,mlp.gate_proj,1.88262272,0.01000,1.154
36
- 4,mlp.down_proj,0.04099274,0.01000,3.204
37
- 5,self_attn.k_proj,1.86057818,0.01000,1.155
38
- 5,self_attn.v_proj,0.22285002,0.01000,1.134
39
- 5,self_attn.q_proj,3.10485601,0.01000,1.180
40
- 5,self_attn.o_proj,0.01251093,0.01000,1.143
41
- 5,mlp.up_proj,1.46818447,0.01000,1.146
42
- 5,mlp.gate_proj,2.07031012,0.01000,1.169
43
- 5,mlp.down_proj,0.05284793,0.01000,3.139
44
- 6,self_attn.k_proj,1.41580844,0.01000,1.122
45
- 6,self_attn.v_proj,0.21924368,0.01000,1.158
46
- 6,self_attn.q_proj,2.65340567,0.01000,1.147
47
- 6,self_attn.o_proj,0.01863250,0.01000,1.138
48
- 6,mlp.up_proj,1.53119409,0.01000,1.164
49
- 6,mlp.gate_proj,2.13722944,0.01000,1.171
50
- 6,mlp.down_proj,0.05822247,0.01000,3.178
51
- 7,self_attn.k_proj,1.33923364,0.01000,1.145
52
- 7,self_attn.v_proj,0.19492055,0.01000,1.125
53
- 7,self_attn.q_proj,2.26367903,0.01000,1.146
54
- 7,self_attn.o_proj,0.02339792,0.01000,1.152
55
- 7,mlp.up_proj,1.61240244,0.01000,1.144
56
- 7,mlp.gate_proj,2.06814051,0.01000,1.140
57
- 7,mlp.down_proj,0.06485046,0.01000,3.188
58
- 8,self_attn.k_proj,1.72186375,0.01000,1.141
59
- 8,self_attn.v_proj,0.24632689,0.01000,1.135
60
- 8,self_attn.q_proj,2.87150645,0.01000,1.164
61
- 8,self_attn.o_proj,0.03228246,0.01000,1.145
62
- 8,mlp.up_proj,1.66218758,0.01000,1.159
63
- 8,mlp.gate_proj,2.17076254,0.01000,1.185
64
- 8,mlp.down_proj,0.06700595,0.01000,3.180
65
- 9,self_attn.k_proj,1.63053393,0.01000,1.151
66
- 9,self_attn.v_proj,0.29964578,0.01000,1.148
67
- 9,self_attn.q_proj,2.75603867,0.01000,1.159
68
- 9,self_attn.o_proj,0.03246364,0.01000,1.158
69
- 9,mlp.up_proj,1.66436744,0.01000,1.139
70
- 9,mlp.gate_proj,2.09544492,0.01000,1.164
71
- 9,mlp.down_proj,0.06654672,0.01000,3.110
72
- 10,self_attn.k_proj,1.71625137,0.01000,1.417
73
- 10,self_attn.v_proj,0.23680860,0.01000,1.134
74
- 10,self_attn.q_proj,2.78978491,0.01000,1.153
75
- 10,self_attn.o_proj,0.02899919,0.01000,1.181
76
- 10,mlp.up_proj,1.76738119,0.01000,1.148
77
- 10,mlp.gate_proj,2.07832718,0.01000,1.183
78
- 10,mlp.down_proj,0.07146379,0.01000,3.131
79
- 11,self_attn.k_proj,1.32459235,0.01000,1.141
80
- 11,self_attn.v_proj,0.28146595,0.01000,1.131
81
- 11,self_attn.q_proj,2.36020613,0.01000,1.178
82
- 11,self_attn.o_proj,0.03698180,0.01000,1.160
83
- 11,mlp.up_proj,1.90443850,0.01000,1.184
84
- 11,mlp.gate_proj,2.15822124,0.01000,1.158
85
- 11,mlp.down_proj,0.08127841,0.01000,3.138
86
- 12,self_attn.k_proj,1.97247875,0.01000,1.150
87
- 12,self_attn.v_proj,0.30387902,0.01000,1.127
88
- 12,self_attn.q_proj,3.29090500,0.01000,1.136
89
- 12,self_attn.o_proj,0.04466573,0.01000,1.132
90
- 12,mlp.up_proj,2.00009823,0.01000,1.146
91
- 12,mlp.gate_proj,2.24844861,0.01000,1.147
92
- 12,mlp.down_proj,0.09179184,0.01000,3.251
93
- 13,self_attn.k_proj,2.20049191,0.01000,1.158
94
- 13,self_attn.v_proj,0.34632075,0.01000,1.159
95
- 13,self_attn.q_proj,3.41837978,0.01000,1.149
96
- 13,self_attn.o_proj,0.04902930,0.01000,1.135
97
- 13,mlp.up_proj,2.17827463,0.01000,1.148
98
- 13,mlp.gate_proj,2.59816766,0.01000,1.159
99
- 13,mlp.down_proj,0.11659020,0.01000,3.148
100
- 14,self_attn.k_proj,1.75478387,0.01000,1.114
101
- 14,self_attn.v_proj,0.39836311,0.01000,1.127
102
- 14,self_attn.q_proj,3.66679001,0.01000,1.154
103
- 14,self_attn.o_proj,0.06044153,0.01000,1.145
104
- 14,mlp.up_proj,2.32195139,0.01000,1.181
105
- 14,mlp.gate_proj,2.79072547,0.01000,1.158
106
- 14,mlp.down_proj,0.14615875,0.01000,3.236
107
- 15,self_attn.k_proj,2.02502155,0.01000,1.166
108
- 15,self_attn.v_proj,0.40373188,0.01000,1.135
109
- 15,self_attn.q_proj,3.85390139,0.01000,1.183
110
- 15,self_attn.o_proj,0.04099876,0.01000,1.126
111
- 15,mlp.up_proj,2.39323020,0.01000,1.162
112
- 15,mlp.gate_proj,3.09810781,0.01000,1.154
113
- 15,mlp.down_proj,0.15945630,0.01000,3.149
114
- 16,self_attn.k_proj,2.24789000,0.01000,1.133
115
- 16,self_attn.v_proj,0.44044137,0.01000,1.151
116
- 16,self_attn.q_proj,3.99555898,0.01000,1.159
117
- 16,self_attn.o_proj,0.03019350,0.01000,1.142
118
- 16,mlp.up_proj,2.44461060,0.01000,1.168
119
- 16,mlp.gate_proj,3.25726128,0.01000,1.187
120
- 16,mlp.down_proj,0.15433976,0.01000,3.161
121
- 17,self_attn.k_proj,2.09545541,0.01000,1.135
122
- 17,self_attn.v_proj,0.43348342,0.01000,1.147
123
- 17,self_attn.q_proj,3.85930681,0.01000,1.158
124
- 17,self_attn.o_proj,0.02748003,0.01000,1.158
125
- 17,mlp.up_proj,2.53550029,0.01000,1.169
126
- 17,mlp.gate_proj,3.43495655,0.01000,1.159
127
- 17,mlp.down_proj,0.16544822,0.01000,3.143
128
- 18,self_attn.k_proj,2.36760187,0.01000,1.130
129
- 18,self_attn.v_proj,0.52266914,0.01000,1.162
130
- 18,self_attn.q_proj,4.23445797,0.01000,1.209
131
- 18,self_attn.o_proj,0.02904772,0.01000,1.162
132
- 18,mlp.up_proj,2.71687889,0.01000,1.134
133
- 18,mlp.gate_proj,3.60506201,0.01000,1.156
134
- 18,mlp.down_proj,0.17471251,0.01000,3.190
135
- 19,self_attn.k_proj,2.20339632,0.01000,1.139
136
- 19,self_attn.v_proj,0.52427340,0.01000,1.139
137
- 19,self_attn.q_proj,3.82244349,0.01000,1.155
138
- 19,self_attn.o_proj,0.04299172,0.01000,1.140
139
- 19,mlp.up_proj,2.92481565,0.01000,1.177
140
- 19,mlp.gate_proj,3.81721783,0.01000,1.208
141
- 19,mlp.down_proj,0.21938494,0.01000,3.164
142
- 20,self_attn.k_proj,2.38230228,0.01000,1.118
143
- 20,self_attn.v_proj,0.61960191,0.01000,1.130
144
- 20,self_attn.q_proj,3.94168520,0.01000,1.157
145
- 20,self_attn.o_proj,0.04088939,0.01000,1.155
146
- 20,mlp.up_proj,2.98803997,0.01000,1.153
147
- 20,mlp.gate_proj,3.73036146,0.01000,1.159
148
- 20,mlp.down_proj,0.22134039,0.01000,3.196
149
- 21,self_attn.k_proj,2.30610347,0.01000,1.144
150
- 21,self_attn.v_proj,0.79631335,0.01000,1.157
151
- 21,self_attn.q_proj,3.86093950,0.01000,1.146
152
- 21,self_attn.o_proj,0.04069402,0.01000,1.137
153
- 21,mlp.up_proj,3.20080495,0.01000,1.162
154
- 21,mlp.gate_proj,4.03069019,0.01000,1.178
155
- 21,mlp.down_proj,0.23245370,0.01000,3.147
156
- 22,self_attn.k_proj,2.18278742,0.01000,1.205
157
- 22,self_attn.v_proj,0.80734658,0.01000,1.140
158
- 22,self_attn.q_proj,3.80389190,0.01000,1.150
159
- 22,self_attn.o_proj,0.03824257,0.01000,1.163
160
- 22,mlp.up_proj,3.45145941,0.01000,1.176
161
- 22,mlp.gate_proj,4.35514832,0.01000,1.148
162
- 22,mlp.down_proj,0.26078928,0.01000,3.145
163
- 23,self_attn.k_proj,2.32202196,0.01000,1.141
164
- 23,self_attn.v_proj,0.79082692,0.01000,1.164
165
- 23,self_attn.q_proj,3.77259874,0.01000,1.164
166
- 23,self_attn.o_proj,0.07018079,0.01000,1.126
167
- 23,mlp.up_proj,3.79414082,0.01000,1.163
168
- 23,mlp.gate_proj,5.01220703,0.01000,1.144
169
- 23,mlp.down_proj,0.31240845,0.01000,3.183
170
- 24,self_attn.k_proj,2.54174876,0.01000,1.144
171
- 24,self_attn.v_proj,1.12363541,0.01000,1.152
172
- 24,self_attn.q_proj,4.08204651,0.01000,1.160
173
- 24,self_attn.o_proj,0.07914403,0.01000,1.156
174
- 24,mlp.up_proj,4.27621031,0.01000,1.138
175
- 24,mlp.gate_proj,5.73402596,0.01000,1.154
176
- 24,mlp.down_proj,0.38886082,0.01000,3.174
177
- 25,self_attn.k_proj,2.08625603,0.01000,1.155
178
- 25,self_attn.v_proj,1.03544307,0.01000,1.145
179
- 25,self_attn.q_proj,4.05644989,0.01000,1.171
180
- 25,self_attn.o_proj,0.10321535,0.01000,1.178
181
- 25,mlp.up_proj,4.61544085,0.01000,1.144
182
- 25,mlp.gate_proj,6.17409420,0.01000,1.164
183
- 25,mlp.down_proj,0.52019978,0.01000,3.172
184
- 26,self_attn.k_proj,2.38002038,0.01000,1.156
185
- 26,self_attn.v_proj,1.40352118,0.01000,1.176
186
- 26,self_attn.q_proj,3.68223524,0.01000,1.157
187
- 26,self_attn.o_proj,0.16447946,0.01000,1.146
188
- 26,mlp.up_proj,4.85717821,0.01000,1.168
189
- 26,mlp.gate_proj,6.55735397,0.01000,1.165
190
- 26,mlp.down_proj,0.76687741,0.01000,3.129
191
- 27,self_attn.k_proj,1.65952611,0.01000,1.158
192
- 27,self_attn.v_proj,0.90589255,0.01000,1.190
193
- 27,self_attn.q_proj,2.93714190,0.01000,1.156
194
- 27,self_attn.o_proj,0.37936646,0.01000,1.164
195
- 27,mlp.up_proj,5.13470936,0.01000,1.161
196
- 27,mlp.gate_proj,6.15918636,0.01000,1.140
197
- 27,mlp.down_proj,1.88660908,0.01000,3.237
 
1
  layer,module,loss,samples,damp,time
2
+ 0,self_attn.k_proj,0.57348979,0.01000,1.101
3
+ 0,self_attn.v_proj,0.02992631,0.01000,1.083
4
+ 0,self_attn.q_proj,1.12482524,0.01000,1.095
5
+ 0,self_attn.o_proj,0.00123981,0.01000,1.088
6
+ 0,mlp.up_proj,0.71145487,0.01000,1.110
7
+ 0,mlp.gate_proj,0.81329715,0.01000,1.129
8
+ 0,mlp.down_proj,0.01093513,0.01000,3.119
9
+ 1,self_attn.k_proj,0.74367076,0.01000,1.122
10
+ 1,self_attn.v_proj,0.08594101,0.01000,1.106
11
+ 1,self_attn.q_proj,1.27566791,0.01000,1.114
12
+ 1,self_attn.o_proj,0.00476055,0.01000,1.105
13
+ 1,mlp.up_proj,0.99940991,0.01000,1.137
14
+ 1,mlp.gate_proj,1.13917911,0.01000,1.131
15
+ 1,mlp.down_proj,0.12524097,0.01000,3.134
16
+ 2,self_attn.k_proj,3.61536407,0.01000,1.099
17
+ 2,self_attn.v_proj,0.36897749,0.01000,1.096
18
+ 2,self_attn.q_proj,6.09369278,0.01000,1.125
19
+ 2,self_attn.o_proj,0.00595129,0.01000,1.123
20
+ 2,mlp.up_proj,1.57945013,0.01000,1.193
21
+ 2,mlp.gate_proj,1.86483383,0.01000,1.140
22
+ 2,mlp.down_proj,0.03576290,0.01000,3.141
23
+ 3,self_attn.k_proj,2.34764647,0.01000,1.187
24
+ 3,self_attn.v_proj,0.41367924,0.01000,1.129
25
+ 3,self_attn.q_proj,4.28345490,0.01000,1.130
26
+ 3,self_attn.o_proj,0.01283259,0.01000,1.112
27
+ 3,mlp.up_proj,2.06658602,0.01000,1.146
28
+ 3,mlp.gate_proj,2.75131416,0.01000,1.137
29
+ 3,mlp.down_proj,0.05543867,0.01000,3.116
30
+ 4,self_attn.k_proj,2.20512915,0.01000,1.152
31
+ 4,self_attn.v_proj,0.42244333,0.01000,1.107
32
+ 4,self_attn.q_proj,4.19914150,0.01000,1.129
33
+ 4,self_attn.o_proj,0.01911609,0.01000,1.133
34
+ 4,mlp.up_proj,2.42648292,0.01000,1.136
35
+ 4,mlp.gate_proj,3.61736584,0.01000,1.187
36
+ 4,mlp.down_proj,0.07793631,0.01000,3.147
37
+ 5,self_attn.k_proj,3.54735780,0.01000,1.106
38
+ 5,self_attn.v_proj,0.42594641,0.01000,1.106
39
+ 5,self_attn.q_proj,5.93417883,0.01000,1.122
40
+ 5,self_attn.o_proj,0.02330331,0.01000,1.122
41
+ 5,mlp.up_proj,2.81386232,0.01000,1.139
42
+ 5,mlp.gate_proj,3.96837521,0.01000,1.151
43
+ 5,mlp.down_proj,0.10042880,0.01000,3.100
44
+ 6,self_attn.k_proj,2.70604372,0.01000,1.122
45
+ 6,self_attn.v_proj,0.41878402,0.01000,1.100
46
+ 6,self_attn.q_proj,5.07468605,0.01000,1.164
47
+ 6,self_attn.o_proj,0.03428555,0.01000,1.130
48
+ 6,mlp.up_proj,2.92948699,0.01000,1.128
49
+ 6,mlp.gate_proj,4.09053612,0.01000,1.139
50
+ 6,mlp.down_proj,0.11020730,0.01000,3.142
51
+ 7,self_attn.k_proj,2.56192708,0.01000,1.105
52
+ 7,self_attn.v_proj,0.37280792,0.01000,1.113
53
+ 7,self_attn.q_proj,4.33243322,0.01000,1.117
54
+ 7,self_attn.o_proj,0.04311103,0.01000,1.124
55
+ 7,mlp.up_proj,3.09119558,0.01000,1.154
56
+ 7,mlp.gate_proj,3.96394897,0.01000,1.116
57
+ 7,mlp.down_proj,0.12291946,0.01000,3.111
58
+ 8,self_attn.k_proj,3.28836107,0.01000,1.114
59
+ 8,self_attn.v_proj,0.47108710,0.01000,1.112
60
+ 8,self_attn.q_proj,5.49438858,0.01000,1.126
61
+ 8,self_attn.o_proj,0.06026545,0.01000,1.109
62
+ 8,mlp.up_proj,3.16844177,0.01000,1.147
63
+ 8,mlp.gate_proj,4.13681126,0.01000,1.133
64
+ 8,mlp.down_proj,0.12639077,0.01000,3.141
65
+ 9,self_attn.k_proj,3.11001682,0.01000,1.147
66
+ 9,self_attn.v_proj,0.57155442,0.01000,1.130
67
+ 9,self_attn.q_proj,5.25478554,0.01000,1.176
68
+ 9,self_attn.o_proj,0.05964671,0.01000,1.164
69
+ 9,mlp.up_proj,3.15676737,0.01000,1.162
70
+ 9,mlp.gate_proj,3.97617245,0.01000,1.133
71
+ 9,mlp.down_proj,0.12478939,0.01000,3.119
72
+ 10,self_attn.k_proj,3.26966572,0.01000,1.131
73
+ 10,self_attn.v_proj,0.45004451,0.01000,1.112
74
+ 10,self_attn.q_proj,5.30321121,0.01000,1.142
75
+ 10,self_attn.o_proj,0.05341929,0.01000,1.132
76
+ 10,mlp.up_proj,3.35345793,0.01000,1.196
77
+ 10,mlp.gate_proj,3.94216251,0.01000,1.174
78
+ 10,mlp.down_proj,0.13452166,0.01000,3.080
79
+ 11,self_attn.k_proj,2.52076197,0.01000,1.152
80
+ 11,self_attn.v_proj,0.53631318,0.01000,1.116
81
+ 11,self_attn.q_proj,4.49594688,0.01000,1.112
82
+ 11,self_attn.o_proj,0.06898431,0.01000,1.122
83
+ 11,mlp.up_proj,3.61847162,0.01000,1.165
84
+ 11,mlp.gate_proj,4.10153961,0.01000,1.116
85
+ 11,mlp.down_proj,0.15326369,0.01000,3.086
86
+ 12,self_attn.k_proj,3.76040173,0.01000,1.128
87
+ 12,self_attn.v_proj,0.57905239,0.01000,1.176
88
+ 12,self_attn.q_proj,6.26392555,0.01000,1.107
89
+ 12,self_attn.o_proj,0.08288961,0.01000,1.122
90
+ 12,mlp.up_proj,3.79364228,0.01000,1.191
91
+ 12,mlp.gate_proj,4.26222324,0.01000,1.158
92
+ 12,mlp.down_proj,0.17245661,0.01000,3.106
93
+ 13,self_attn.k_proj,4.17454338,0.01000,1.124
94
+ 13,self_attn.v_proj,0.65613842,0.01000,1.129
95
+ 13,self_attn.q_proj,6.48309612,0.01000,1.112
96
+ 13,self_attn.o_proj,0.08975884,0.01000,1.105
97
+ 13,mlp.up_proj,4.12620115,0.01000,1.149
98
+ 13,mlp.gate_proj,4.92243528,0.01000,1.127
99
+ 13,mlp.down_proj,0.21988256,0.01000,3.108
100
+ 14,self_attn.k_proj,3.32866430,0.01000,1.136
101
+ 14,self_attn.v_proj,0.75655323,0.01000,1.097
102
+ 14,self_attn.q_proj,6.95757151,0.01000,1.134
103
+ 14,self_attn.o_proj,0.11242675,0.01000,1.145
104
+ 14,mlp.up_proj,4.40335560,0.01000,1.159
105
+ 14,mlp.gate_proj,5.29281664,0.01000,1.150
106
+ 14,mlp.down_proj,0.27417624,0.01000,3.150
107
+ 15,self_attn.k_proj,3.84503889,0.01000,1.148
108
+ 15,self_attn.v_proj,0.76655364,0.01000,1.103
109
+ 15,self_attn.q_proj,7.31272936,0.01000,1.137
110
+ 15,self_attn.o_proj,0.07379784,0.01000,1.101
111
+ 15,mlp.up_proj,4.55024004,0.01000,1.200
112
+ 15,mlp.gate_proj,5.88753128,0.01000,1.137
113
+ 15,mlp.down_proj,0.29958892,0.01000,3.079
114
+ 16,self_attn.k_proj,4.27809811,0.01000,1.117
115
+ 16,self_attn.v_proj,0.83709764,0.01000,1.134
116
+ 16,self_attn.q_proj,7.59177876,0.01000,1.126
117
+ 16,self_attn.o_proj,0.05505002,0.01000,1.109
118
+ 16,mlp.up_proj,4.66512632,0.01000,1.139
119
+ 16,mlp.gate_proj,6.21557331,0.01000,1.145
120
+ 16,mlp.down_proj,0.29199547,0.01000,3.142
121
+ 17,self_attn.k_proj,3.99537516,0.01000,1.133
122
+ 17,self_attn.v_proj,0.82619518,0.01000,1.118
123
+ 17,self_attn.q_proj,7.35900211,0.01000,1.123
124
+ 17,self_attn.o_proj,0.05116026,0.01000,1.113
125
+ 17,mlp.up_proj,4.85350800,0.01000,1.139
126
+ 17,mlp.gate_proj,6.57617331,0.01000,1.139
127
+ 17,mlp.down_proj,0.31245530,0.01000,3.110
128
+ 18,self_attn.k_proj,4.51366901,0.01000,1.136
129
+ 18,self_attn.v_proj,0.99721968,0.01000,1.102
130
+ 18,self_attn.q_proj,8.07002068,0.01000,1.129
131
+ 18,self_attn.o_proj,0.05473011,0.01000,1.106
132
+ 18,mlp.up_proj,5.22503281,0.01000,1.119
133
+ 18,mlp.gate_proj,6.93419027,0.01000,1.149
134
+ 18,mlp.down_proj,0.33353916,0.01000,3.098
135
+ 19,self_attn.k_proj,4.22218132,0.01000,1.162
136
+ 19,self_attn.v_proj,1.00496328,0.01000,1.149
137
+ 19,self_attn.q_proj,7.31388569,0.01000,1.129
138
+ 19,self_attn.o_proj,0.07915132,0.01000,1.183
139
+ 19,mlp.up_proj,5.62336969,0.01000,1.137
140
+ 19,mlp.gate_proj,7.33508205,0.01000,1.136
141
+ 19,mlp.down_proj,0.41691202,0.01000,3.145
142
+ 20,self_attn.k_proj,4.55664349,0.01000,1.113
143
+ 20,self_attn.v_proj,1.19031966,0.01000,1.136
144
+ 20,self_attn.q_proj,7.54975128,0.01000,1.128
145
+ 20,self_attn.o_proj,0.07554041,0.01000,1.119
146
+ 20,mlp.up_proj,5.75148487,0.01000,1.143
147
+ 20,mlp.gate_proj,7.17578554,0.01000,1.166
148
+ 20,mlp.down_proj,0.42174736,0.01000,3.105
149
+ 21,self_attn.k_proj,4.42211723,0.01000,1.173
150
+ 21,self_attn.v_proj,1.52764320,0.01000,1.114
151
+ 21,self_attn.q_proj,7.39887810,0.01000,1.135
152
+ 21,self_attn.o_proj,0.07596338,0.01000,1.121
153
+ 21,mlp.up_proj,6.17190742,0.01000,1.145
154
+ 21,mlp.gate_proj,7.76521111,0.01000,1.130
155
+ 21,mlp.down_proj,0.44396168,0.01000,3.123
156
+ 22,self_attn.k_proj,4.18366241,0.01000,1.106
157
+ 22,self_attn.v_proj,1.55225110,0.01000,1.110
158
+ 22,self_attn.q_proj,7.29905701,0.01000,1.152
159
+ 22,self_attn.o_proj,0.06833672,0.01000,1.134
160
+ 22,mlp.up_proj,6.65676212,0.01000,1.178
161
+ 22,mlp.gate_proj,8.40142918,0.01000,1.131
162
+ 22,mlp.down_proj,0.49725312,0.01000,3.171
163
+ 23,self_attn.k_proj,4.44097424,0.01000,1.122
164
+ 23,self_attn.v_proj,1.51754737,0.01000,1.107
165
+ 23,self_attn.q_proj,7.22582531,0.01000,1.147
166
+ 23,self_attn.o_proj,0.12661582,0.01000,1.114
167
+ 23,mlp.up_proj,7.31189728,0.01000,1.131
168
+ 23,mlp.gate_proj,9.66457844,0.01000,1.122
169
+ 23,mlp.down_proj,0.59769487,0.01000,3.103
170
+ 24,self_attn.k_proj,4.87307644,0.01000,1.105
171
+ 24,self_attn.v_proj,2.15399027,0.01000,1.138
172
+ 24,self_attn.q_proj,7.82933807,0.01000,1.128
173
+ 24,self_attn.o_proj,0.14315630,0.01000,1.166
174
+ 24,mlp.up_proj,8.24588013,0.01000,1.124
175
+ 24,mlp.gate_proj,11.05454826,0.01000,1.127
176
+ 24,mlp.down_proj,0.74648660,0.01000,3.122
177
+ 25,self_attn.k_proj,4.00452709,0.01000,1.119
178
+ 25,self_attn.v_proj,1.98942447,0.01000,1.128
179
+ 25,self_attn.q_proj,7.78156376,0.01000,1.117
180
+ 25,self_attn.o_proj,0.19304600,0.01000,1.117
181
+ 25,mlp.up_proj,8.88384628,0.01000,1.165
182
+ 25,mlp.gate_proj,11.88053036,0.01000,1.126
183
+ 25,mlp.down_proj,0.99862719,0.01000,3.124
184
+ 26,self_attn.k_proj,4.53559971,0.01000,1.138
185
+ 26,self_attn.v_proj,2.68204308,0.01000,1.116
186
+ 26,self_attn.q_proj,7.01802683,0.01000,1.171
187
+ 26,self_attn.o_proj,0.28712690,0.01000,1.114
188
+ 26,mlp.up_proj,9.31034470,0.01000,1.128
189
+ 26,mlp.gate_proj,12.55875587,0.01000,1.154
190
+ 26,mlp.down_proj,1.47142649,0.01000,3.096
191
+ 27,self_attn.k_proj,3.15559483,0.01000,1.119
192
+ 27,self_attn.v_proj,1.72210693,0.01000,1.119
193
+ 27,self_attn.q_proj,5.58061886,0.01000,1.167
194
+ 27,self_attn.o_proj,0.70267087,0.01000,1.129
195
+ 27,mlp.up_proj,9.85498810,0.01000,1.158
196
+ 27,mlp.gate_proj,11.81561852,0.01000,1.139
197
+ 27,mlp.down_proj,3.57119989,0.01000,3.075