|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,0.0000432854,0.05000,1.766
|
|
0,self_attn.v_proj,0.0000049972,0.05000,1.793
|
|
0,self_attn.q_proj,0.0001757931,0.05000,1.798
|
|
0,self_attn.o_proj,0.0000108898,0.05000,0.778
|
|
0,mlp.up_proj,0.0003301854,0.05000,1.146
|
|
0,mlp.gate_proj,0.0007666261,0.05000,1.183
|
|
0,mlp.down_proj,0.0000141513,0.05000,5.336
|
|
1,self_attn.k_proj,0.0000358306,0.05000,1.767
|
|
1,self_attn.q_proj,0.0001356997,0.05000,1.789
|
|
1,self_attn.v_proj,0.0000092715,0.05000,1.792
|
|
1,self_attn.o_proj,0.0000043125,0.05000,0.785
|
|
1,mlp.up_proj,0.0068297327,0.05000,1.161
|
|
1,mlp.gate_proj,0.0110956548,0.05000,1.184
|
|
1,mlp.down_proj,0.0000095164,0.05000,5.333
|
|
2,self_attn.k_proj,0.0000858678,0.05000,1.750
|
|
2,self_attn.v_proj,0.0000151014,0.05000,1.786
|
|
2,self_attn.q_proj,0.0003180285,0.05000,1.790
|
|
2,self_attn.o_proj,0.0000078531,0.05000,0.777
|
|
2,mlp.up_proj,0.0060570274,0.05000,1.143
|
|
2,mlp.gate_proj,0.0098869666,0.05000,1.177
|
|
2,mlp.down_proj,0.0000373999,0.05000,5.348
|
|
3,self_attn.k_proj,0.0000810958,0.05000,1.771
|
|
3,self_attn.q_proj,0.0003177889,0.05000,1.790
|
|
3,self_attn.v_proj,0.0000203367,0.05000,1.792
|
|
3,self_attn.o_proj,0.0000193827,0.05000,0.780
|
|
3,mlp.up_proj,0.0127348766,0.05000,1.154
|
|
3,mlp.gate_proj,0.0171400174,0.05000,1.185
|
|
3,mlp.down_proj,0.0021732034,0.05000,5.357
|
|
4,self_attn.k_proj,0.0001399196,0.05000,1.776
|
|
4,self_attn.q_proj,0.0006156289,0.05000,1.794
|
|
4,self_attn.v_proj,0.0000480736,0.05000,1.796
|
|
4,self_attn.o_proj,0.0000394140,0.05000,0.788
|
|
4,mlp.up_proj,0.0090971480,0.05000,1.153
|
|
4,mlp.gate_proj,0.0135318746,0.05000,1.185
|
|
4,mlp.down_proj,0.0023862841,0.05000,5.319
|
|
5,self_attn.k_proj,0.0001325996,0.05000,1.784
|
|
5,self_attn.q_proj,0.0006572159,0.05000,1.797
|
|
5,self_attn.v_proj,0.0000548861,0.05000,1.799
|
|
5,self_attn.o_proj,0.0000599871,0.05000,0.795
|
|
5,mlp.up_proj,0.0147371594,0.05000,1.171
|
|
5,mlp.gate_proj,0.0186996124,0.05000,1.195
|
|
5,mlp.down_proj,0.0002437168,0.05000,5.403
|
|
6,self_attn.k_proj,0.0000885772,0.05000,1.742
|
|
6,self_attn.v_proj,0.0000421790,0.05000,1.777
|
|
6,self_attn.q_proj,0.0004314109,0.05000,1.783
|
|
6,self_attn.o_proj,0.0000446818,0.05000,0.794
|
|
6,mlp.up_proj,0.0026338197,0.05000,1.157
|
|
6,mlp.gate_proj,0.0037542884,0.05000,1.188
|
|
6,mlp.down_proj,0.0000997583,0.05000,5.390
|
|
7,self_attn.k_proj,0.0000925571,0.05000,1.789
|
|
7,self_attn.q_proj,0.0005228582,0.05000,1.802
|
|
7,self_attn.v_proj,0.0000846739,0.05000,1.804
|
|
7,self_attn.o_proj,0.0000540034,0.05000,0.791
|
|
7,mlp.up_proj,0.0021272203,0.05000,1.164
|
|
7,mlp.gate_proj,0.0023616219,0.05000,1.187
|
|
7,mlp.down_proj,0.0001141313,0.05000,5.314
|
|
8,self_attn.k_proj,0.0001738771,0.05000,1.777
|
|
8,self_attn.v_proj,0.0000707547,0.05000,1.794
|
|
8,self_attn.q_proj,0.0007570342,0.05000,1.799
|
|
8,self_attn.o_proj,0.0000702879,0.05000,0.788
|
|
8,mlp.up_proj,0.0023392382,0.05000,1.160
|
|
8,mlp.gate_proj,0.0024381351,0.05000,1.184
|
|
8,mlp.down_proj,0.0001141036,0.05000,5.359
|
|
9,self_attn.k_proj,0.0001255440,0.05000,1.747
|
|
9,self_attn.v_proj,0.0001075853,0.05000,1.781
|
|
9,self_attn.q_proj,0.0006896859,0.05000,1.785
|
|
9,self_attn.o_proj,0.0000752609,0.05000,0.778
|
|
9,mlp.up_proj,0.0046194003,0.05000,1.152
|
|
9,mlp.gate_proj,0.0072552940,0.05000,1.185
|
|
9,mlp.down_proj,0.0001435438,0.05000,5.375
|
|
10,self_attn.v_proj,0.0000711022,0.05000,1.815
|
|
10,self_attn.k_proj,0.0001285309,0.05000,1.819
|
|
10,self_attn.q_proj,0.0006438414,0.05000,1.842
|
|
10,self_attn.o_proj,0.0000531726,0.05000,0.780
|
|
10,mlp.up_proj,0.0023653700,0.05000,1.150
|
|
10,mlp.gate_proj,0.0026815632,0.05000,1.183
|
|
10,mlp.down_proj,0.0000887731,0.05000,5.373
|
|
11,self_attn.k_proj,0.0001696957,0.05000,1.778
|
|
11,self_attn.v_proj,0.0000648065,0.05000,1.797
|
|
11,self_attn.q_proj,0.0007402942,0.05000,1.801
|
|
11,self_attn.o_proj,0.0000742858,0.05000,0.783
|
|
11,mlp.up_proj,0.0021493328,0.05000,1.163
|
|
11,mlp.gate_proj,0.0022600763,0.05000,1.190
|
|
11,mlp.down_proj,0.0002429208,0.05000,5.360
|
|
12,self_attn.k_proj,0.0001913924,0.05000,1.775
|
|
12,self_attn.v_proj,0.0000848261,0.05000,1.794
|
|
12,self_attn.q_proj,0.0008414217,0.05000,1.799
|
|
12,self_attn.o_proj,0.0000603520,0.05000,0.791
|
|
12,mlp.up_proj,0.0021892047,0.05000,1.165
|
|
12,mlp.gate_proj,0.0021619192,0.05000,1.188
|
|
12,mlp.down_proj,0.0000992026,0.05000,5.388
|
|
13,self_attn.k_proj,0.0001764100,0.05000,1.783
|
|
13,self_attn.v_proj,0.0001123422,0.05000,1.800
|
|
13,self_attn.q_proj,0.0009153854,0.05000,1.803
|
|
13,self_attn.o_proj,0.0000794259,0.05000,0.789
|
|
13,mlp.up_proj,0.0022109749,0.05000,1.161
|
|
13,mlp.gate_proj,0.0023554429,0.05000,1.187
|
|
13,mlp.down_proj,0.0000893284,0.05000,5.370
|
|
14,self_attn.k_proj,0.0002561925,0.05000,1.782
|
|
14,self_attn.v_proj,0.0001154645,0.05000,1.787
|
|
14,self_attn.q_proj,0.0013007666,0.05000,1.813
|
|
14,self_attn.o_proj,0.0001204233,0.05000,0.781
|
|
14,mlp.up_proj,0.0025638388,0.05000,1.145
|
|
14,mlp.gate_proj,0.0025896619,0.05000,1.171
|
|
14,mlp.down_proj,0.0000961390,0.05000,5.339
|
|
15,self_attn.k_proj,0.0002411058,0.05000,1.771
|
|
15,self_attn.v_proj,0.0001010086,0.05000,1.779
|
|
15,self_attn.q_proj,0.0010763963,0.05000,1.806
|
|
15,self_attn.o_proj,0.0001248457,0.05000,0.779
|
|
15,mlp.up_proj,0.0025943129,0.05000,1.146
|
|
15,mlp.gate_proj,0.0025343251,0.05000,1.173
|
|
15,mlp.down_proj,0.0001141996,0.05000,5.327
|
|
16,self_attn.k_proj,0.0002437389,0.05000,1.762
|
|
16,self_attn.v_proj,0.0001444091,0.05000,1.778
|
|
16,self_attn.q_proj,0.0012326450,0.05000,1.798
|
|
16,self_attn.o_proj,0.0001986508,0.05000,0.780
|
|
16,mlp.up_proj,0.0028457921,0.05000,1.147
|
|
16,mlp.gate_proj,0.0027699758,0.05000,1.172
|
|
16,mlp.down_proj,0.0001097131,0.05000,5.343
|
|
17,self_attn.k_proj,0.0002372200,0.05000,1.779
|
|
17,self_attn.v_proj,0.0001644637,0.05000,1.785
|
|
17,self_attn.q_proj,0.0013344949,0.05000,1.804
|
|
17,self_attn.o_proj,0.0001687157,0.05000,0.777
|
|
17,mlp.up_proj,0.0034605139,0.05000,1.152
|
|
17,mlp.gate_proj,0.0032823749,0.05000,1.177
|
|
17,mlp.down_proj,0.0001509321,0.05000,5.323
|
|
18,self_attn.k_proj,0.0001887011,0.05000,1.765
|
|
18,self_attn.v_proj,0.0001808350,0.05000,1.779
|
|
18,self_attn.q_proj,0.0010705749,0.05000,1.801
|
|
18,self_attn.o_proj,0.0001657871,0.05000,0.783
|
|
18,mlp.up_proj,0.0040642183,0.05000,1.148
|
|
18,mlp.gate_proj,0.0037679110,0.05000,1.174
|
|
18,mlp.down_proj,0.0002181015,0.05000,5.336
|
|
19,self_attn.k_proj,0.0002055513,0.05000,1.769
|
|
19,self_attn.v_proj,0.0002454614,0.05000,1.785
|
|
19,self_attn.q_proj,0.0013781268,0.05000,1.805
|
|
19,self_attn.o_proj,0.0002243668,0.05000,0.781
|
|
19,mlp.up_proj,0.0046072615,0.05000,1.154
|
|
19,mlp.gate_proj,0.0044774732,0.05000,1.177
|
|
19,mlp.down_proj,0.0002187767,0.05000,5.333
|
|
20,self_attn.k_proj,0.0002085851,0.05000,1.772
|
|
20,self_attn.v_proj,0.0002610162,0.05000,1.786
|
|
20,self_attn.q_proj,0.0013019970,0.05000,1.806
|
|
20,self_attn.o_proj,0.0001514216,0.05000,0.781
|
|
20,mlp.up_proj,0.0054252240,0.05000,1.148
|
|
20,mlp.gate_proj,0.0051634870,0.05000,1.173
|
|
20,mlp.down_proj,0.0003712054,0.05000,5.326
|
|
21,self_attn.k_proj,0.0002118031,0.05000,1.759
|
|
21,self_attn.v_proj,0.0003764736,0.05000,1.772
|
|
21,self_attn.q_proj,0.0015059532,0.05000,1.788
|
|
21,self_attn.o_proj,0.0004255283,0.05000,0.782
|
|
21,mlp.up_proj,0.0066461328,0.05000,1.147
|
|
21,mlp.gate_proj,0.0066254139,0.05000,1.174
|
|
21,mlp.down_proj,0.0005992475,0.05000,5.317
|
|
22,self_attn.k_proj,0.0002988659,0.05000,1.769
|
|
22,self_attn.v_proj,0.0005736383,0.05000,1.783
|
|
22,self_attn.q_proj,0.0021297575,0.05000,1.807
|
|
22,self_attn.o_proj,0.0004206545,0.05000,0.780
|
|
22,mlp.up_proj,0.0094454406,0.05000,1.151
|
|
22,mlp.gate_proj,0.0092535556,0.05000,1.175
|
|
22,mlp.down_proj,0.0008095826,0.05000,5.324
|
|
23,self_attn.k_proj,0.0003835323,0.05000,1.771
|
|
23,self_attn.v_proj,0.0007766295,0.05000,1.785
|
|
23,self_attn.q_proj,0.0024568439,0.05000,1.806
|
|
23,self_attn.o_proj,0.0008100346,0.05000,0.780
|
|
23,mlp.up_proj,0.0125601661,0.05000,1.148
|
|
23,mlp.gate_proj,0.0126166713,0.05000,1.174
|
|
23,mlp.down_proj,0.0009607696,0.05000,5.323
|
|
24,self_attn.k_proj,0.0003131202,0.05000,1.760
|
|
24,self_attn.v_proj,0.0008387528,0.05000,1.777
|
|
24,self_attn.q_proj,0.0022884397,0.05000,1.799
|
|
24,self_attn.o_proj,0.0006900308,0.05000,0.784
|
|
24,mlp.up_proj,0.0137791785,0.05000,1.152
|
|
24,mlp.gate_proj,0.0128174114,0.05000,1.177
|
|
24,mlp.down_proj,0.0013900608,0.05000,5.345
|
|
25,self_attn.k_proj,0.0003696309,0.05000,1.796
|
|
25,self_attn.v_proj,0.0014799064,0.05000,1.798
|
|
25,self_attn.q_proj,0.0027035042,0.05000,1.818
|
|
25,self_attn.o_proj,0.0010714627,0.05000,0.780
|
|
25,mlp.up_proj,0.0188588492,0.05000,1.149
|
|
25,mlp.gate_proj,0.0167194957,0.05000,1.181
|
|
25,mlp.down_proj,0.0112290785,0.05000,5.347
|
|
26,self_attn.k_proj,0.0005632932,0.05000,1.775
|
|
26,self_attn.v_proj,0.0039053194,0.05000,1.784
|
|
26,self_attn.q_proj,0.0044603734,0.05000,1.806
|
|
26,self_attn.o_proj,0.0024405535,0.05000,0.786
|
|
26,mlp.up_proj,0.0201260808,0.05000,1.157
|
|
26,mlp.gate_proj,0.0176544122,0.05000,1.180
|
|
26,mlp.down_proj,0.0254254744,0.05000,5.332
|
|
27,self_attn.k_proj,0.0007584638,0.05000,1.767
|
|
27,self_attn.v_proj,0.0063212753,0.05000,1.781
|
|
27,self_attn.q_proj,0.0070051274,0.05000,1.795
|
|
27,self_attn.o_proj,0.0045859847,0.05000,0.785
|
|
27,mlp.up_proj,0.0242716040,0.05000,1.155
|
|
27,mlp.gate_proj,0.0231725800,0.05000,1.181
|
|
27,mlp.down_proj,0.0212887442,0.05000,5.341
|
|
|