|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,0.00069060,0.01000,1.029
|
|
0,self_attn.v_proj,0.00008147,0.01000,0.472
|
|
0,self_attn.q_proj,0.00321008,0.01000,0.482
|
|
0,self_attn.o_proj,0.00047103,0.01000,0.493
|
|
0,mlp.up_proj,0.00436171,0.01000,0.541
|
|
0,mlp.gate_proj,0.00562274,0.01000,0.505
|
|
0,mlp.down_proj,0.00085413,0.01000,3.217
|
|
1,self_attn.k_proj,0.00034248,0.01000,0.533
|
|
1,self_attn.v_proj,0.00006137,0.01000,0.472
|
|
1,self_attn.q_proj,0.00121677,0.01000,0.474
|
|
1,self_attn.o_proj,0.00011810,0.01000,0.494
|
|
1,mlp.up_proj,0.13315737,0.01000,0.513
|
|
1,mlp.gate_proj,0.17934367,0.01000,0.497
|
|
1,mlp.down_proj,0.00008329,0.01000,3.138
|
|
2,self_attn.k_proj,0.00038424,0.01000,0.557
|
|
2,self_attn.v_proj,0.00008452,0.01000,0.510
|
|
2,self_attn.q_proj,0.00170009,0.01000,0.516
|
|
2,self_attn.o_proj,0.00010261,0.01000,0.486
|
|
2,mlp.up_proj,0.05518855,0.01000,0.508
|
|
2,mlp.gate_proj,0.04516597,0.01000,0.494
|
|
2,mlp.down_proj,0.00515580,0.01000,3.216
|
|
3,self_attn.k_proj,0.00154116,0.01000,0.507
|
|
3,self_attn.v_proj,0.00029368,0.01000,0.507
|
|
3,self_attn.q_proj,0.00724024,0.01000,0.480
|
|
3,self_attn.o_proj,0.00018070,0.01000,0.490
|
|
3,mlp.up_proj,0.08040726,0.01000,0.511
|
|
3,mlp.gate_proj,0.07821976,0.01000,0.494
|
|
3,mlp.down_proj,0.00053932,0.01000,3.158
|
|
4,self_attn.k_proj,0.00095915,0.01000,0.502
|
|
4,self_attn.v_proj,0.00031529,0.01000,0.475
|
|
4,self_attn.q_proj,0.00489937,0.01000,0.478
|
|
4,self_attn.o_proj,0.00030713,0.01000,0.590
|
|
4,mlp.up_proj,0.05972803,0.01000,0.514
|
|
4,mlp.gate_proj,0.07408385,0.01000,0.552
|
|
4,mlp.down_proj,0.00066552,0.01000,3.155
|
|
5,self_attn.k_proj,0.00147027,0.01000,0.493
|
|
5,self_attn.v_proj,0.00048919,0.01000,0.505
|
|
5,self_attn.q_proj,0.00825339,0.01000,0.559
|
|
5,self_attn.o_proj,0.00023145,0.01000,0.502
|
|
5,mlp.up_proj,0.08986730,0.01000,0.519
|
|
5,mlp.gate_proj,0.10963946,0.01000,0.501
|
|
5,mlp.down_proj,0.00130154,0.01000,3.170
|
|
6,self_attn.k_proj,0.00103089,0.01000,0.504
|
|
6,self_attn.v_proj,0.00061901,0.01000,0.471
|
|
6,self_attn.q_proj,0.00609575,0.01000,0.473
|
|
6,self_attn.o_proj,0.00063878,0.01000,0.489
|
|
6,mlp.up_proj,0.11683443,0.01000,0.511
|
|
6,mlp.gate_proj,0.13332176,0.01000,0.500
|
|
6,mlp.down_proj,0.00145119,0.01000,3.157
|
|
7,self_attn.k_proj,0.00135148,0.01000,0.495
|
|
7,self_attn.v_proj,0.00083617,0.01000,0.468
|
|
7,self_attn.q_proj,0.00884062,0.01000,0.472
|
|
7,self_attn.o_proj,0.00045116,0.01000,0.491
|
|
7,mlp.up_proj,0.12256874,0.01000,0.532
|
|
7,mlp.gate_proj,0.14637680,0.01000,0.573
|
|
7,mlp.down_proj,0.00233087,0.01000,3.185
|
|
8,self_attn.k_proj,0.00143536,0.01000,0.500
|
|
8,self_attn.v_proj,0.00096026,0.01000,0.524
|
|
8,self_attn.q_proj,0.00936532,0.01000,0.530
|
|
8,self_attn.o_proj,0.00049681,0.01000,0.540
|
|
8,mlp.up_proj,0.12503704,0.01000,0.526
|
|
8,mlp.gate_proj,0.17915115,0.01000,0.505
|
|
8,mlp.down_proj,0.00234245,0.01000,3.183
|
|
9,self_attn.k_proj,0.00143120,0.01000,0.505
|
|
9,self_attn.v_proj,0.00079513,0.01000,0.479
|
|
9,self_attn.q_proj,0.00797836,0.01000,0.478
|
|
9,self_attn.o_proj,0.00068180,0.01000,0.495
|
|
9,mlp.up_proj,0.11117899,0.01000,0.518
|
|
9,mlp.gate_proj,0.16715510,0.01000,0.498
|
|
9,mlp.down_proj,0.00310383,0.01000,3.162
|
|
10,self_attn.k_proj,0.00160306,0.01000,0.492
|
|
10,self_attn.v_proj,0.00109001,0.01000,0.470
|
|
10,self_attn.q_proj,0.01080495,0.01000,0.478
|
|
10,self_attn.o_proj,0.00084409,0.01000,0.504
|
|
10,mlp.up_proj,0.08392834,0.01000,0.521
|
|
10,mlp.gate_proj,0.12971427,0.01000,0.562
|
|
10,mlp.down_proj,0.00405339,0.01000,3.183
|
|
11,self_attn.k_proj,0.00122218,0.01000,0.493
|
|
11,self_attn.v_proj,0.00099423,0.01000,0.550
|
|
11,self_attn.q_proj,0.00794288,0.01000,0.553
|
|
11,self_attn.o_proj,0.00098513,0.01000,0.497
|
|
11,mlp.up_proj,0.04812239,0.01000,0.509
|
|
11,mlp.gate_proj,0.06757517,0.01000,0.493
|
|
11,mlp.down_proj,0.00568819,0.01000,3.207
|
|
12,self_attn.k_proj,0.00135649,0.01000,0.495
|
|
12,self_attn.v_proj,0.00095998,0.01000,0.483
|
|
12,self_attn.q_proj,0.00892941,0.01000,0.483
|
|
12,self_attn.o_proj,0.00108744,0.01000,0.522
|
|
12,mlp.up_proj,0.05381161,0.01000,0.529
|
|
12,mlp.gate_proj,0.07598484,0.01000,0.505
|
|
12,mlp.down_proj,0.00539491,0.01000,3.291
|
|
13,self_attn.k_proj,0.00178134,0.01000,0.527
|
|
13,self_attn.v_proj,0.00058557,0.01000,0.491
|
|
13,self_attn.q_proj,0.00892488,0.01000,0.516
|
|
13,self_attn.o_proj,0.00064293,0.01000,0.504
|
|
13,mlp.up_proj,0.04396489,0.01000,0.554
|
|
13,mlp.gate_proj,0.04568858,0.01000,0.527
|
|
13,mlp.down_proj,0.00565900,0.01000,3.395
|
|
14,self_attn.k_proj,0.00135609,0.01000,0.493
|
|
14,self_attn.v_proj,0.00082203,0.01000,0.547
|
|
14,self_attn.q_proj,0.00883573,0.01000,0.470
|
|
14,self_attn.o_proj,0.00131206,0.01000,0.507
|
|
14,mlp.up_proj,0.04743307,0.01000,0.513
|
|
14,mlp.gate_proj,0.04887400,0.01000,0.497
|
|
14,mlp.down_proj,0.00661326,0.01000,3.147
|
|
15,self_attn.k_proj,0.00155714,0.01000,0.506
|
|
15,self_attn.v_proj,0.00092119,0.01000,0.479
|
|
15,self_attn.q_proj,0.00995570,0.01000,0.539
|
|
15,self_attn.o_proj,0.00136074,0.01000,0.500
|
|
15,mlp.up_proj,0.04853380,0.01000,0.511
|
|
15,mlp.gate_proj,0.04559516,0.01000,0.495
|
|
15,mlp.down_proj,0.00638492,0.01000,3.148
|
|
16,self_attn.k_proj,0.00198390,0.01000,0.530
|
|
16,self_attn.v_proj,0.00113709,0.01000,0.507
|
|
16,self_attn.q_proj,0.01223878,0.01000,0.475
|
|
16,self_attn.o_proj,0.00148312,0.01000,0.489
|
|
16,mlp.up_proj,0.04892960,0.01000,0.541
|
|
16,mlp.gate_proj,0.05012077,0.01000,0.561
|
|
16,mlp.down_proj,0.00597043,0.01000,3.166
|
|
17,self_attn.k_proj,0.00280038,0.01000,0.496
|
|
17,self_attn.v_proj,0.00146818,0.01000,0.540
|
|
17,self_attn.q_proj,0.01687030,0.01000,0.497
|
|
17,self_attn.o_proj,0.00135879,0.01000,0.496
|
|
17,mlp.up_proj,0.04682782,0.01000,0.510
|
|
17,mlp.gate_proj,0.04579859,0.01000,0.492
|
|
17,mlp.down_proj,0.00761481,0.01000,3.238
|
|
18,self_attn.k_proj,0.00169533,0.01000,0.504
|
|
18,self_attn.v_proj,0.00126828,0.01000,0.471
|
|
18,self_attn.q_proj,0.01179836,0.01000,0.482
|
|
18,self_attn.o_proj,0.00126228,0.01000,0.522
|
|
18,mlp.up_proj,0.04505775,0.01000,0.512
|
|
18,mlp.gate_proj,0.04577068,0.01000,0.498
|
|
18,mlp.down_proj,0.00619347,0.01000,3.186
|
|
19,self_attn.k_proj,0.00236209,0.01000,0.514
|
|
19,self_attn.v_proj,0.00123736,0.01000,0.491
|
|
19,self_attn.q_proj,0.01400776,0.01000,0.526
|
|
19,self_attn.o_proj,0.00176100,0.01000,0.493
|
|
19,mlp.up_proj,0.04820779,0.01000,0.553
|
|
19,mlp.gate_proj,0.04570930,0.01000,0.600
|
|
19,mlp.down_proj,0.00793979,0.01000,3.357
|
|
20,self_attn.k_proj,0.00256892,0.01000,0.493
|
|
20,self_attn.v_proj,0.00260168,0.01000,0.550
|
|
20,self_attn.q_proj,0.02125032,0.01000,0.477
|
|
20,self_attn.o_proj,0.00280044,0.01000,0.497
|
|
20,mlp.up_proj,0.05057632,0.01000,0.519
|
|
20,mlp.gate_proj,0.04847589,0.01000,0.495
|
|
20,mlp.down_proj,0.00903307,0.01000,3.187
|
|
21,self_attn.k_proj,0.00277045,0.01000,0.500
|
|
21,self_attn.v_proj,0.00198452,0.01000,0.478
|
|
21,self_attn.q_proj,0.01851394,0.01000,0.479
|
|
21,self_attn.o_proj,0.00218527,0.01000,0.496
|
|
21,mlp.up_proj,0.05114579,0.01000,0.519
|
|
21,mlp.gate_proj,0.05338387,0.01000,0.499
|
|
21,mlp.down_proj,0.00733775,0.01000,3.188
|
|
22,self_attn.k_proj,0.00326175,0.01000,0.494
|
|
22,self_attn.v_proj,0.00250720,0.01000,0.475
|
|
22,self_attn.q_proj,0.02128556,0.01000,0.477
|
|
22,self_attn.o_proj,0.00235567,0.01000,0.492
|
|
22,mlp.up_proj,0.05586936,0.01000,0.570
|
|
22,mlp.gate_proj,0.05644500,0.01000,0.512
|
|
22,mlp.down_proj,0.00800653,0.01000,3.235
|
|
23,self_attn.k_proj,0.00299606,0.01000,0.494
|
|
23,self_attn.v_proj,0.00155715,0.01000,0.471
|
|
23,self_attn.q_proj,0.01925512,0.01000,0.473
|
|
23,self_attn.o_proj,0.00178259,0.01000,0.536
|
|
23,mlp.up_proj,0.06007682,0.01000,0.521
|
|
23,mlp.gate_proj,0.05663780,0.01000,0.496
|
|
23,mlp.down_proj,0.00945445,0.01000,9.186
|
|
24,self_attn.k_proj,0.00225264,0.01000,0.980
|
|
24,self_attn.v_proj,0.00187703,0.01000,1.371
|
|
24,self_attn.q_proj,0.01681715,0.01000,6.686
|
|
24,self_attn.o_proj,0.00246775,0.01000,1.328
|
|
24,mlp.up_proj,0.06072681,0.01000,0.944
|
|
24,mlp.gate_proj,0.05807892,0.01000,1.001
|
|
24,mlp.down_proj,0.00991773,0.01000,18.358
|
|
25,self_attn.k_proj,0.00229649,0.01000,8.503
|
|
25,self_attn.v_proj,0.00291831,0.01000,4.319
|
|
25,self_attn.q_proj,0.02437538,0.01000,3.804
|
|
25,self_attn.o_proj,0.00237260,0.01000,1.286
|
|
25,mlp.up_proj,0.06846089,0.01000,10.826
|
|
25,mlp.gate_proj,0.06569070,0.01000,9.100
|
|
25,mlp.down_proj,0.01337931,0.01000,33.601
|
|
26,self_attn.k_proj,0.00267915,0.01000,1.255
|
|
26,self_attn.v_proj,0.00322842,0.01000,3.481
|
|
26,self_attn.q_proj,0.02083185,0.01000,5.436
|
|
26,self_attn.o_proj,0.00308602,0.01000,7.156
|
|
26,mlp.up_proj,0.08263549,0.01000,1.335
|
|
26,mlp.gate_proj,0.07662739,0.01000,3.503
|
|
26,mlp.down_proj,0.01771094,0.01000,21.777
|
|
27,self_attn.k_proj,0.00287940,0.01000,3.159
|
|
27,self_attn.v_proj,0.00416089,0.01000,4.204
|
|
27,self_attn.q_proj,0.03279902,0.01000,1.774
|
|
27,self_attn.o_proj,0.00550491,0.01000,3.372
|
|
27,mlp.up_proj,0.09059777,0.01000,3.954
|
|
27,mlp.gate_proj,0.08867668,0.01000,9.505
|
|
27,mlp.down_proj,0.02109897,0.01000,30.538
|
|
28,self_attn.k_proj,0.00278399,0.01000,7.684
|
|
28,self_attn.v_proj,0.00438421,0.01000,1.185
|
|
28,self_attn.q_proj,0.02441998,0.01000,1.490
|
|
28,self_attn.o_proj,0.00504620,0.01000,1.659
|
|
28,mlp.up_proj,0.10423768,0.01000,6.048
|
|
28,mlp.gate_proj,0.10313836,0.01000,2.000
|
|
28,mlp.down_proj,0.02453683,0.01000,25.117
|
|
29,self_attn.k_proj,0.00324912,0.01000,7.286
|
|
29,self_attn.v_proj,0.00431707,0.01000,3.652
|
|
29,self_attn.q_proj,0.02698709,0.01000,9.020
|
|
29,self_attn.o_proj,0.00393811,0.01000,1.285
|
|
29,mlp.up_proj,0.13072219,0.01000,7.825
|
|
29,mlp.gate_proj,0.12731788,0.01000,1.260
|
|
29,mlp.down_proj,0.03455354,0.01000,31.130
|
|
30,self_attn.k_proj,0.00299078,0.01000,3.355
|
|
30,self_attn.v_proj,0.00842608,0.01000,1.227
|
|
30,self_attn.q_proj,0.02935425,0.01000,9.509
|
|
30,self_attn.o_proj,0.00491209,0.01000,6.748
|
|
30,mlp.up_proj,0.17074524,0.01000,1.335
|
|
30,mlp.gate_proj,0.15690112,0.01000,1.254
|
|
30,mlp.down_proj,0.09282688,0.01000,20.732
|
|
31,self_attn.k_proj,0.00382955,0.01000,8.693
|
|
31,self_attn.v_proj,0.01071948,0.01000,5.567
|
|
31,self_attn.q_proj,0.03053109,0.01000,1.216
|
|
31,self_attn.o_proj,0.00866138,0.01000,2.271
|
|
31,mlp.up_proj,0.20006534,0.01000,9.636
|
|
31,mlp.gate_proj,0.17307433,0.01000,4.535
|
|
31,mlp.down_proj,0.08568206,0.01000,26.561
|
|
32,self_attn.k_proj,0.00522043,0.01000,4.314
|
|
32,self_attn.v_proj,0.03462721,0.01000,9.529
|
|
32,self_attn.q_proj,0.04134069,0.01000,2.139
|
|
32,self_attn.o_proj,0.00988561,0.01000,2.949
|
|
32,mlp.up_proj,0.19264194,0.01000,2.229
|
|
32,mlp.gate_proj,0.16856745,0.01000,4.380
|
|
32,mlp.down_proj,0.08202425,0.01000,25.548
|
|
33,self_attn.k_proj,0.00480200,0.01000,1.251
|
|
33,self_attn.v_proj,0.07019998,0.01000,1.479
|
|
33,self_attn.q_proj,0.05121958,0.01000,7.949
|
|
33,self_attn.o_proj,0.01627044,0.01000,5.901
|
|
33,mlp.up_proj,0.17824389,0.01000,1.281
|
|
33,mlp.gate_proj,0.14435218,0.01000,3.857
|
|
33,mlp.down_proj,0.14946091,0.01000,24.800
|
|
34,self_attn.k_proj,0.00254513,0.01000,8.091
|
|
34,self_attn.v_proj,0.00760822,0.01000,1.215
|
|
34,self_attn.q_proj,0.02376374,0.01000,1.308
|
|
34,self_attn.o_proj,0.01036366,0.01000,12.004
|
|
34,mlp.up_proj,0.18489864,0.01000,3.845
|
|
34,mlp.gate_proj,0.15819445,0.01000,1.324
|
|
34,mlp.down_proj,0.09072845,0.01000,20.542
|
|
35,self_attn.k_proj,0.00257981,0.01000,1.463
|
|
35,self_attn.v_proj,0.00711143,0.01000,7.436
|
|
35,self_attn.q_proj,0.02256388,0.01000,4.156
|
|
35,self_attn.o_proj,0.00808490,0.01000,1.323
|
|
35,mlp.up_proj,0.23674777,0.01000,13.245
|
|
35,mlp.gate_proj,0.22639820,0.01000,13.503
|
|
35,mlp.down_proj,0.13450164,0.01000,23.163
|
|
|