viveksil's picture
Add files using upload-large-folder tool
5d63dbc verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00069060,0.01000,1.029
0,self_attn.v_proj,0.00008147,0.01000,0.472
0,self_attn.q_proj,0.00321008,0.01000,0.482
0,self_attn.o_proj,0.00047103,0.01000,0.493
0,mlp.up_proj,0.00436171,0.01000,0.541
0,mlp.gate_proj,0.00562274,0.01000,0.505
0,mlp.down_proj,0.00085413,0.01000,3.217
1,self_attn.k_proj,0.00034248,0.01000,0.533
1,self_attn.v_proj,0.00006137,0.01000,0.472
1,self_attn.q_proj,0.00121677,0.01000,0.474
1,self_attn.o_proj,0.00011810,0.01000,0.494
1,mlp.up_proj,0.13315737,0.01000,0.513
1,mlp.gate_proj,0.17934367,0.01000,0.497
1,mlp.down_proj,0.00008329,0.01000,3.138
2,self_attn.k_proj,0.00038424,0.01000,0.557
2,self_attn.v_proj,0.00008452,0.01000,0.510
2,self_attn.q_proj,0.00170009,0.01000,0.516
2,self_attn.o_proj,0.00010261,0.01000,0.486
2,mlp.up_proj,0.05518855,0.01000,0.508
2,mlp.gate_proj,0.04516597,0.01000,0.494
2,mlp.down_proj,0.00515580,0.01000,3.216
3,self_attn.k_proj,0.00154116,0.01000,0.507
3,self_attn.v_proj,0.00029368,0.01000,0.507
3,self_attn.q_proj,0.00724024,0.01000,0.480
3,self_attn.o_proj,0.00018070,0.01000,0.490
3,mlp.up_proj,0.08040726,0.01000,0.511
3,mlp.gate_proj,0.07821976,0.01000,0.494
3,mlp.down_proj,0.00053932,0.01000,3.158
4,self_attn.k_proj,0.00095915,0.01000,0.502
4,self_attn.v_proj,0.00031529,0.01000,0.475
4,self_attn.q_proj,0.00489937,0.01000,0.478
4,self_attn.o_proj,0.00030713,0.01000,0.590
4,mlp.up_proj,0.05972803,0.01000,0.514
4,mlp.gate_proj,0.07408385,0.01000,0.552
4,mlp.down_proj,0.00066552,0.01000,3.155
5,self_attn.k_proj,0.00147027,0.01000,0.493
5,self_attn.v_proj,0.00048919,0.01000,0.505
5,self_attn.q_proj,0.00825339,0.01000,0.559
5,self_attn.o_proj,0.00023145,0.01000,0.502
5,mlp.up_proj,0.08986730,0.01000,0.519
5,mlp.gate_proj,0.10963946,0.01000,0.501
5,mlp.down_proj,0.00130154,0.01000,3.170
6,self_attn.k_proj,0.00103089,0.01000,0.504
6,self_attn.v_proj,0.00061901,0.01000,0.471
6,self_attn.q_proj,0.00609575,0.01000,0.473
6,self_attn.o_proj,0.00063878,0.01000,0.489
6,mlp.up_proj,0.11683443,0.01000,0.511
6,mlp.gate_proj,0.13332176,0.01000,0.500
6,mlp.down_proj,0.00145119,0.01000,3.157
7,self_attn.k_proj,0.00135148,0.01000,0.495
7,self_attn.v_proj,0.00083617,0.01000,0.468
7,self_attn.q_proj,0.00884062,0.01000,0.472
7,self_attn.o_proj,0.00045116,0.01000,0.491
7,mlp.up_proj,0.12256874,0.01000,0.532
7,mlp.gate_proj,0.14637680,0.01000,0.573
7,mlp.down_proj,0.00233087,0.01000,3.185
8,self_attn.k_proj,0.00143536,0.01000,0.500
8,self_attn.v_proj,0.00096026,0.01000,0.524
8,self_attn.q_proj,0.00936532,0.01000,0.530
8,self_attn.o_proj,0.00049681,0.01000,0.540
8,mlp.up_proj,0.12503704,0.01000,0.526
8,mlp.gate_proj,0.17915115,0.01000,0.505
8,mlp.down_proj,0.00234245,0.01000,3.183
9,self_attn.k_proj,0.00143120,0.01000,0.505
9,self_attn.v_proj,0.00079513,0.01000,0.479
9,self_attn.q_proj,0.00797836,0.01000,0.478
9,self_attn.o_proj,0.00068180,0.01000,0.495
9,mlp.up_proj,0.11117899,0.01000,0.518
9,mlp.gate_proj,0.16715510,0.01000,0.498
9,mlp.down_proj,0.00310383,0.01000,3.162
10,self_attn.k_proj,0.00160306,0.01000,0.492
10,self_attn.v_proj,0.00109001,0.01000,0.470
10,self_attn.q_proj,0.01080495,0.01000,0.478
10,self_attn.o_proj,0.00084409,0.01000,0.504
10,mlp.up_proj,0.08392834,0.01000,0.521
10,mlp.gate_proj,0.12971427,0.01000,0.562
10,mlp.down_proj,0.00405339,0.01000,3.183
11,self_attn.k_proj,0.00122218,0.01000,0.493
11,self_attn.v_proj,0.00099423,0.01000,0.550
11,self_attn.q_proj,0.00794288,0.01000,0.553
11,self_attn.o_proj,0.00098513,0.01000,0.497
11,mlp.up_proj,0.04812239,0.01000,0.509
11,mlp.gate_proj,0.06757517,0.01000,0.493
11,mlp.down_proj,0.00568819,0.01000,3.207
12,self_attn.k_proj,0.00135649,0.01000,0.495
12,self_attn.v_proj,0.00095998,0.01000,0.483
12,self_attn.q_proj,0.00892941,0.01000,0.483
12,self_attn.o_proj,0.00108744,0.01000,0.522
12,mlp.up_proj,0.05381161,0.01000,0.529
12,mlp.gate_proj,0.07598484,0.01000,0.505
12,mlp.down_proj,0.00539491,0.01000,3.291
13,self_attn.k_proj,0.00178134,0.01000,0.527
13,self_attn.v_proj,0.00058557,0.01000,0.491
13,self_attn.q_proj,0.00892488,0.01000,0.516
13,self_attn.o_proj,0.00064293,0.01000,0.504
13,mlp.up_proj,0.04396489,0.01000,0.554
13,mlp.gate_proj,0.04568858,0.01000,0.527
13,mlp.down_proj,0.00565900,0.01000,3.395
14,self_attn.k_proj,0.00135609,0.01000,0.493
14,self_attn.v_proj,0.00082203,0.01000,0.547
14,self_attn.q_proj,0.00883573,0.01000,0.470
14,self_attn.o_proj,0.00131206,0.01000,0.507
14,mlp.up_proj,0.04743307,0.01000,0.513
14,mlp.gate_proj,0.04887400,0.01000,0.497
14,mlp.down_proj,0.00661326,0.01000,3.147
15,self_attn.k_proj,0.00155714,0.01000,0.506
15,self_attn.v_proj,0.00092119,0.01000,0.479
15,self_attn.q_proj,0.00995570,0.01000,0.539
15,self_attn.o_proj,0.00136074,0.01000,0.500
15,mlp.up_proj,0.04853380,0.01000,0.511
15,mlp.gate_proj,0.04559516,0.01000,0.495
15,mlp.down_proj,0.00638492,0.01000,3.148
16,self_attn.k_proj,0.00198390,0.01000,0.530
16,self_attn.v_proj,0.00113709,0.01000,0.507
16,self_attn.q_proj,0.01223878,0.01000,0.475
16,self_attn.o_proj,0.00148312,0.01000,0.489
16,mlp.up_proj,0.04892960,0.01000,0.541
16,mlp.gate_proj,0.05012077,0.01000,0.561
16,mlp.down_proj,0.00597043,0.01000,3.166
17,self_attn.k_proj,0.00280038,0.01000,0.496
17,self_attn.v_proj,0.00146818,0.01000,0.540
17,self_attn.q_proj,0.01687030,0.01000,0.497
17,self_attn.o_proj,0.00135879,0.01000,0.496
17,mlp.up_proj,0.04682782,0.01000,0.510
17,mlp.gate_proj,0.04579859,0.01000,0.492
17,mlp.down_proj,0.00761481,0.01000,3.238
18,self_attn.k_proj,0.00169533,0.01000,0.504
18,self_attn.v_proj,0.00126828,0.01000,0.471
18,self_attn.q_proj,0.01179836,0.01000,0.482
18,self_attn.o_proj,0.00126228,0.01000,0.522
18,mlp.up_proj,0.04505775,0.01000,0.512
18,mlp.gate_proj,0.04577068,0.01000,0.498
18,mlp.down_proj,0.00619347,0.01000,3.186
19,self_attn.k_proj,0.00236209,0.01000,0.514
19,self_attn.v_proj,0.00123736,0.01000,0.491
19,self_attn.q_proj,0.01400776,0.01000,0.526
19,self_attn.o_proj,0.00176100,0.01000,0.493
19,mlp.up_proj,0.04820779,0.01000,0.553
19,mlp.gate_proj,0.04570930,0.01000,0.600
19,mlp.down_proj,0.00793979,0.01000,3.357
20,self_attn.k_proj,0.00256892,0.01000,0.493
20,self_attn.v_proj,0.00260168,0.01000,0.550
20,self_attn.q_proj,0.02125032,0.01000,0.477
20,self_attn.o_proj,0.00280044,0.01000,0.497
20,mlp.up_proj,0.05057632,0.01000,0.519
20,mlp.gate_proj,0.04847589,0.01000,0.495
20,mlp.down_proj,0.00903307,0.01000,3.187
21,self_attn.k_proj,0.00277045,0.01000,0.500
21,self_attn.v_proj,0.00198452,0.01000,0.478
21,self_attn.q_proj,0.01851394,0.01000,0.479
21,self_attn.o_proj,0.00218527,0.01000,0.496
21,mlp.up_proj,0.05114579,0.01000,0.519
21,mlp.gate_proj,0.05338387,0.01000,0.499
21,mlp.down_proj,0.00733775,0.01000,3.188
22,self_attn.k_proj,0.00326175,0.01000,0.494
22,self_attn.v_proj,0.00250720,0.01000,0.475
22,self_attn.q_proj,0.02128556,0.01000,0.477
22,self_attn.o_proj,0.00235567,0.01000,0.492
22,mlp.up_proj,0.05586936,0.01000,0.570
22,mlp.gate_proj,0.05644500,0.01000,0.512
22,mlp.down_proj,0.00800653,0.01000,3.235
23,self_attn.k_proj,0.00299606,0.01000,0.494
23,self_attn.v_proj,0.00155715,0.01000,0.471
23,self_attn.q_proj,0.01925512,0.01000,0.473
23,self_attn.o_proj,0.00178259,0.01000,0.536
23,mlp.up_proj,0.06007682,0.01000,0.521
23,mlp.gate_proj,0.05663780,0.01000,0.496
23,mlp.down_proj,0.00945445,0.01000,9.186
24,self_attn.k_proj,0.00225264,0.01000,0.980
24,self_attn.v_proj,0.00187703,0.01000,1.371
24,self_attn.q_proj,0.01681715,0.01000,6.686
24,self_attn.o_proj,0.00246775,0.01000,1.328
24,mlp.up_proj,0.06072681,0.01000,0.944
24,mlp.gate_proj,0.05807892,0.01000,1.001
24,mlp.down_proj,0.00991773,0.01000,18.358
25,self_attn.k_proj,0.00229649,0.01000,8.503
25,self_attn.v_proj,0.00291831,0.01000,4.319
25,self_attn.q_proj,0.02437538,0.01000,3.804
25,self_attn.o_proj,0.00237260,0.01000,1.286
25,mlp.up_proj,0.06846089,0.01000,10.826
25,mlp.gate_proj,0.06569070,0.01000,9.100
25,mlp.down_proj,0.01337931,0.01000,33.601
26,self_attn.k_proj,0.00267915,0.01000,1.255
26,self_attn.v_proj,0.00322842,0.01000,3.481
26,self_attn.q_proj,0.02083185,0.01000,5.436
26,self_attn.o_proj,0.00308602,0.01000,7.156
26,mlp.up_proj,0.08263549,0.01000,1.335
26,mlp.gate_proj,0.07662739,0.01000,3.503
26,mlp.down_proj,0.01771094,0.01000,21.777
27,self_attn.k_proj,0.00287940,0.01000,3.159
27,self_attn.v_proj,0.00416089,0.01000,4.204
27,self_attn.q_proj,0.03279902,0.01000,1.774
27,self_attn.o_proj,0.00550491,0.01000,3.372
27,mlp.up_proj,0.09059777,0.01000,3.954
27,mlp.gate_proj,0.08867668,0.01000,9.505
27,mlp.down_proj,0.02109897,0.01000,30.538
28,self_attn.k_proj,0.00278399,0.01000,7.684
28,self_attn.v_proj,0.00438421,0.01000,1.185
28,self_attn.q_proj,0.02441998,0.01000,1.490
28,self_attn.o_proj,0.00504620,0.01000,1.659
28,mlp.up_proj,0.10423768,0.01000,6.048
28,mlp.gate_proj,0.10313836,0.01000,2.000
28,mlp.down_proj,0.02453683,0.01000,25.117
29,self_attn.k_proj,0.00324912,0.01000,7.286
29,self_attn.v_proj,0.00431707,0.01000,3.652
29,self_attn.q_proj,0.02698709,0.01000,9.020
29,self_attn.o_proj,0.00393811,0.01000,1.285
29,mlp.up_proj,0.13072219,0.01000,7.825
29,mlp.gate_proj,0.12731788,0.01000,1.260
29,mlp.down_proj,0.03455354,0.01000,31.130
30,self_attn.k_proj,0.00299078,0.01000,3.355
30,self_attn.v_proj,0.00842608,0.01000,1.227
30,self_attn.q_proj,0.02935425,0.01000,9.509
30,self_attn.o_proj,0.00491209,0.01000,6.748
30,mlp.up_proj,0.17074524,0.01000,1.335
30,mlp.gate_proj,0.15690112,0.01000,1.254
30,mlp.down_proj,0.09282688,0.01000,20.732
31,self_attn.k_proj,0.00382955,0.01000,8.693
31,self_attn.v_proj,0.01071948,0.01000,5.567
31,self_attn.q_proj,0.03053109,0.01000,1.216
31,self_attn.o_proj,0.00866138,0.01000,2.271
31,mlp.up_proj,0.20006534,0.01000,9.636
31,mlp.gate_proj,0.17307433,0.01000,4.535
31,mlp.down_proj,0.08568206,0.01000,26.561
32,self_attn.k_proj,0.00522043,0.01000,4.314
32,self_attn.v_proj,0.03462721,0.01000,9.529
32,self_attn.q_proj,0.04134069,0.01000,2.139
32,self_attn.o_proj,0.00988561,0.01000,2.949
32,mlp.up_proj,0.19264194,0.01000,2.229
32,mlp.gate_proj,0.16856745,0.01000,4.380
32,mlp.down_proj,0.08202425,0.01000,25.548
33,self_attn.k_proj,0.00480200,0.01000,1.251
33,self_attn.v_proj,0.07019998,0.01000,1.479
33,self_attn.q_proj,0.05121958,0.01000,7.949
33,self_attn.o_proj,0.01627044,0.01000,5.901
33,mlp.up_proj,0.17824389,0.01000,1.281
33,mlp.gate_proj,0.14435218,0.01000,3.857
33,mlp.down_proj,0.14946091,0.01000,24.800
34,self_attn.k_proj,0.00254513,0.01000,8.091
34,self_attn.v_proj,0.00760822,0.01000,1.215
34,self_attn.q_proj,0.02376374,0.01000,1.308
34,self_attn.o_proj,0.01036366,0.01000,12.004
34,mlp.up_proj,0.18489864,0.01000,3.845
34,mlp.gate_proj,0.15819445,0.01000,1.324
34,mlp.down_proj,0.09072845,0.01000,20.542
35,self_attn.k_proj,0.00257981,0.01000,1.463
35,self_attn.v_proj,0.00711143,0.01000,7.436
35,self_attn.q_proj,0.02256388,0.01000,4.156
35,self_attn.o_proj,0.00808490,0.01000,1.323
35,mlp.up_proj,0.23674777,0.01000,13.245
35,mlp.gate_proj,0.22639820,0.01000,13.503
35,mlp.down_proj,0.13450164,0.01000,23.163