Dinh's picture
Upload folder using huggingface_hub
7e1604a verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.01274909,0.01000,1.240
0,self_attn.v_proj,0.00214360,0.01000,0.996
0,self_attn.q_proj,0.05843823,0.01000,1.021
0,self_attn.o_proj,0.00274049,0.01000,1.016
0,mlp.up_proj,0.10601919,0.01000,1.031
0,mlp.gate_proj,0.39847262,0.01000,1.027
0,mlp.down_proj,0.00772479,0.01000,6.810
1,self_attn.k_proj,0.01021324,0.01000,1.005
1,self_attn.v_proj,0.00257124,0.01000,0.996
1,self_attn.q_proj,0.03741558,0.01000,1.018
1,self_attn.o_proj,0.00084842,0.01000,1.010
1,mlp.up_proj,1.43357658,0.01000,1.028
1,mlp.gate_proj,2.12231598,0.01000,1.024
1,mlp.down_proj,0.00496998,0.01000,6.781
2,self_attn.k_proj,0.02703509,0.01000,1.000
2,self_attn.v_proj,0.00504902,0.01000,0.989
2,self_attn.q_proj,0.10213473,0.01000,1.013
2,self_attn.o_proj,0.00193177,0.01000,1.005
2,mlp.up_proj,1.58620987,0.01000,1.024
2,mlp.gate_proj,2.42828255,0.01000,1.024
2,mlp.down_proj,0.00601656,0.01000,6.742
3,self_attn.k_proj,0.02690557,0.01000,1.003
3,self_attn.v_proj,0.00689736,0.01000,0.996
3,self_attn.q_proj,0.10322268,0.01000,1.010
3,self_attn.o_proj,0.00642131,0.01000,1.006
3,mlp.up_proj,3.65950470,0.01000,1.026
3,mlp.gate_proj,4.60566330,0.01000,1.035
3,mlp.down_proj,0.02601060,0.01250,8.208
4,self_attn.k_proj,0.04614114,0.01000,1.029
4,self_attn.v_proj,0.01480776,0.01000,1.029
4,self_attn.q_proj,0.20456531,0.01000,1.046
4,self_attn.o_proj,0.00448910,0.01000,1.028
4,mlp.up_proj,2.91298180,0.01000,1.037
4,mlp.gate_proj,4.05700836,0.01000,1.031
4,mlp.down_proj,0.07724582,0.01250,8.358
5,self_attn.k_proj,0.03892767,0.01000,1.027
5,self_attn.v_proj,0.01592588,0.01000,1.025
5,self_attn.q_proj,0.18976243,0.01000,1.043
5,self_attn.o_proj,0.00436232,0.01000,1.037
5,mlp.up_proj,4.21060410,0.01000,1.034
5,mlp.gate_proj,4.93323860,0.01000,1.031
5,mlp.down_proj,0.00724246,0.01000,6.897
6,self_attn.k_proj,0.02429707,0.01000,1.006
6,self_attn.v_proj,0.01225167,0.01000,1.016
6,self_attn.q_proj,0.12069086,0.01000,1.038
6,self_attn.o_proj,0.00645695,0.01000,1.033
6,mlp.up_proj,0.82594872,0.01000,1.054
6,mlp.gate_proj,1.10117245,0.01000,1.053
6,mlp.down_proj,0.01846275,0.01000,6.903
7,self_attn.k_proj,0.02329313,0.01000,1.026
7,self_attn.v_proj,0.02144220,0.01000,1.024
7,self_attn.q_proj,0.13331867,0.01000,1.042
7,self_attn.o_proj,0.01251567,0.01000,1.016
7,mlp.up_proj,0.73551784,0.01000,1.049
7,mlp.gate_proj,0.77921600,0.01000,1.049
7,mlp.down_proj,0.03439705,0.01000,6.873
8,self_attn.k_proj,0.04569775,0.01000,1.007
8,self_attn.v_proj,0.01890234,0.01000,0.997
8,self_attn.q_proj,0.20662723,0.01000,1.018
8,self_attn.o_proj,0.01772243,0.01000,1.012
8,mlp.up_proj,0.90030460,0.01000,1.032
8,mlp.gate_proj,0.90461788,0.01000,1.027
8,mlp.down_proj,0.03843986,0.01000,7.045
9,self_attn.k_proj,0.03546313,0.01000,1.106
9,self_attn.v_proj,0.02996131,0.01000,1.099
9,self_attn.q_proj,0.19824698,0.01000,1.097
9,self_attn.o_proj,0.02716671,0.01000,1.083
9,mlp.up_proj,1.70254269,0.01000,1.121
9,mlp.gate_proj,2.61145973,0.01000,1.129
9,mlp.down_proj,0.03424822,0.01000,7.254
10,self_attn.k_proj,0.03381699,0.01000,1.009
10,self_attn.v_proj,0.01937524,0.01000,0.995
10,self_attn.q_proj,0.17410449,0.01000,1.014
10,self_attn.o_proj,0.01720826,0.01000,1.004
10,mlp.up_proj,0.92787247,0.01000,1.026
10,mlp.gate_proj,1.02021523,0.01000,1.026
10,mlp.down_proj,0.03707029,0.01000,6.859
11,self_attn.k_proj,0.04158755,0.01000,1.017
11,self_attn.v_proj,0.01662142,0.01000,1.005
11,self_attn.q_proj,0.18437350,0.01000,1.025
11,self_attn.o_proj,0.02335539,0.01000,1.019
11,mlp.up_proj,0.86569471,0.01000,1.039
11,mlp.gate_proj,0.89345131,0.01000,1.039
11,mlp.down_proj,0.03659432,0.01000,6.815
12,self_attn.k_proj,0.04609491,0.01000,1.021
12,self_attn.v_proj,0.02227776,0.01000,1.010
12,self_attn.q_proj,0.21181834,0.01000,1.032
12,self_attn.o_proj,0.02827374,0.01000,1.034
12,mlp.up_proj,0.89145584,0.01000,1.053
12,mlp.gate_proj,0.87042551,0.01000,1.041
12,mlp.down_proj,0.04059390,0.01000,6.844
13,self_attn.k_proj,0.04291532,0.01000,1.021
13,self_attn.v_proj,0.02938266,0.01000,1.006
13,self_attn.q_proj,0.23358922,0.01000,1.030
13,self_attn.o_proj,0.04167673,0.01000,1.021
13,mlp.up_proj,0.87737236,0.01000,1.047
13,mlp.gate_proj,0.91676216,0.01000,1.041
13,mlp.down_proj,0.03859301,0.01000,6.835
14,self_attn.k_proj,0.05915552,0.01000,1.021
14,self_attn.v_proj,0.02708837,0.01000,1.007
14,self_attn.q_proj,0.31210327,0.01000,1.032
14,self_attn.o_proj,0.04240547,0.01000,1.026
14,mlp.up_proj,0.96120968,0.01000,1.047
14,mlp.gate_proj,0.95211182,0.01000,1.041
14,mlp.down_proj,0.04331824,0.01000,6.850
15,self_attn.k_proj,0.05826247,0.01000,1.021
15,self_attn.v_proj,0.02519295,0.01000,1.011
15,self_attn.q_proj,0.26803920,0.01000,1.032
15,self_attn.o_proj,0.03413584,0.01000,1.029
15,mlp.up_proj,0.90848255,0.01000,1.046
15,mlp.gate_proj,0.87616615,0.01000,1.041
15,mlp.down_proj,0.04859902,0.01000,6.852
16,self_attn.k_proj,0.05079299,0.01000,1.011
16,self_attn.v_proj,0.03077720,0.01000,0.995
16,self_attn.q_proj,0.26502216,0.01000,1.019
16,self_attn.o_proj,0.05226343,0.01000,1.014
16,mlp.up_proj,0.94974709,0.01000,1.030
16,mlp.gate_proj,0.91194410,0.01000,1.025
16,mlp.down_proj,0.04420947,0.01000,6.780
17,self_attn.k_proj,0.05318869,0.01000,1.019
17,self_attn.v_proj,0.03864379,0.01000,1.012
17,self_attn.q_proj,0.30886962,0.01000,1.033
17,self_attn.o_proj,0.03887460,0.01000,1.029
17,mlp.up_proj,1.16065416,0.01000,1.044
17,mlp.gate_proj,1.08571386,0.01000,1.042
17,mlp.down_proj,0.06242081,0.01000,6.849
18,self_attn.k_proj,0.04165920,0.01000,1.023
18,self_attn.v_proj,0.04310030,0.01000,1.013
18,self_attn.q_proj,0.25575843,0.01000,1.035
18,self_attn.o_proj,0.05644683,0.01000,1.029
18,mlp.up_proj,1.26025496,0.01000,1.052
18,mlp.gate_proj,1.15192699,0.01000,1.039
18,mlp.down_proj,0.07166648,0.01000,6.836
19,self_attn.k_proj,0.04222881,0.01000,1.025
19,self_attn.v_proj,0.05446572,0.01000,1.015
19,self_attn.q_proj,0.30983603,0.01000,1.034
19,self_attn.o_proj,0.06438451,0.01000,1.036
19,mlp.up_proj,1.43575058,0.01000,1.052
19,mlp.gate_proj,1.36489668,0.01000,1.043
19,mlp.down_proj,0.07850655,0.01000,6.877
20,self_attn.k_proj,0.04729198,0.01000,1.022
20,self_attn.v_proj,0.06206809,0.01000,1.013
20,self_attn.q_proj,0.31196122,0.01000,1.035
20,self_attn.o_proj,0.03323518,0.01000,1.027
20,mlp.up_proj,1.82752800,0.01000,1.054
20,mlp.gate_proj,1.70066452,0.01000,1.043
20,mlp.down_proj,0.13648720,0.01000,6.867
21,self_attn.k_proj,0.05044293,0.01000,1.022
21,self_attn.v_proj,0.09859020,0.01000,1.014
21,self_attn.q_proj,0.37178845,0.01000,1.038
21,self_attn.o_proj,0.15084021,0.01000,1.032
21,mlp.up_proj,2.46773129,0.01000,1.049
21,mlp.gate_proj,2.41258640,0.01000,1.048
21,mlp.down_proj,0.19357001,0.01000,6.873
22,self_attn.k_proj,0.07108734,0.01000,1.024
22,self_attn.v_proj,0.16268752,0.01000,1.021
22,self_attn.q_proj,0.52809725,0.01000,1.036
22,self_attn.o_proj,0.07668910,0.01000,1.030
22,mlp.up_proj,3.47492867,0.01000,1.051
22,mlp.gate_proj,3.37544518,0.01000,1.046
22,mlp.down_proj,0.30478077,0.01000,6.880
23,self_attn.k_proj,0.10465989,0.01000,1.033
23,self_attn.v_proj,0.24405675,0.01000,1.020
23,self_attn.q_proj,0.67093091,0.01000,1.038
23,self_attn.o_proj,0.19958943,0.01000,1.029
23,mlp.up_proj,4.96244507,0.01000,1.051
23,mlp.gate_proj,4.98119621,0.01000,1.047
23,mlp.down_proj,0.39886584,0.01000,6.879
24,self_attn.k_proj,0.07962582,0.01000,1.038
24,self_attn.v_proj,0.22561178,0.01000,1.020
24,self_attn.q_proj,0.59075594,0.01000,1.039
24,self_attn.o_proj,0.13933611,0.01000,1.031
24,mlp.up_proj,5.51158943,0.01000,1.051
24,mlp.gate_proj,5.17049103,0.01000,1.052
24,mlp.down_proj,0.53541055,0.01000,6.873
25,self_attn.k_proj,0.09734185,0.01000,1.031
25,self_attn.v_proj,0.38716655,0.01000,1.017
25,self_attn.q_proj,0.70420899,0.01000,1.040
25,self_attn.o_proj,0.20143418,0.01000,1.028
25,mlp.up_proj,7.28550262,0.01000,1.061
25,mlp.gate_proj,6.50514603,0.01000,1.046
25,mlp.down_proj,0.78691392,0.01000,6.865
26,self_attn.k_proj,0.14025826,0.01000,1.039
26,self_attn.v_proj,0.94293957,0.01000,1.011
26,self_attn.q_proj,1.12750330,0.01000,1.031
26,self_attn.o_proj,0.32603059,0.01000,1.026
26,mlp.up_proj,7.41025085,0.01000,1.042
26,mlp.gate_proj,6.49971008,0.01000,1.036
26,mlp.down_proj,0.00078956,0.01250,8.283
27,self_attn.k_proj,0.18448967,0.01000,1.015
27,self_attn.v_proj,1.47590675,0.01000,1.001
27,self_attn.q_proj,1.86292515,0.01000,1.032
27,self_attn.o_proj,0.44092617,0.01000,1.026
27,mlp.up_proj,9.63612976,0.01000,1.038
27,mlp.gate_proj,9.16495056,0.01000,1.033
27,mlp.down_proj,4.99868469,0.01000,6.823