Dinh's picture
Upload folder using huggingface_hub
7502872 verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.01096977,0.01000,1.238
0,self_attn.v_proj,0.00116295,0.01000,0.984
0,self_attn.q_proj,0.04623358,0.01000,1.007
0,self_attn.o_proj,0.00094825,0.01000,0.998
0,mlp.up_proj,0.07947180,0.01000,1.017
0,mlp.gate_proj,0.30171890,0.01000,1.013
0,mlp.down_proj,0.00165321,0.01000,6.762
1,self_attn.k_proj,0.00926878,0.01000,0.987
1,self_attn.v_proj,0.00165668,0.01000,0.982
1,self_attn.q_proj,0.03166184,0.01000,1.005
1,self_attn.o_proj,0.00028134,0.01000,0.998
1,mlp.up_proj,0.82403212,0.01000,1.019
1,mlp.gate_proj,1.45226679,0.01000,1.014
1,mlp.down_proj,0.22467122,0.01250,8.199
2,self_attn.k_proj,0.02382097,0.01000,0.987
2,self_attn.v_proj,0.00361796,0.01000,0.985
2,self_attn.q_proj,0.08421084,0.01000,1.008
2,self_attn.o_proj,0.00054472,0.01000,1.002
2,mlp.up_proj,0.96582470,0.01000,1.024
2,mlp.gate_proj,1.71110992,0.01000,1.016
2,mlp.down_proj,0.00167108,0.01000,6.744
3,self_attn.k_proj,0.02234304,0.01000,0.986
3,self_attn.v_proj,0.00449246,0.01000,0.987
3,self_attn.q_proj,0.07954597,0.01000,1.007
3,self_attn.o_proj,0.00142892,0.01000,1.004
3,mlp.up_proj,2.63362484,0.01000,1.019
3,mlp.gate_proj,3.74241524,0.01000,1.016
3,mlp.down_proj,0.02429631,0.01250,8.227
4,self_attn.k_proj,0.03934093,0.01000,0.996
4,self_attn.v_proj,0.01061609,0.01000,0.987
4,self_attn.q_proj,0.15539491,0.01000,1.013
4,self_attn.o_proj,0.00109535,0.01000,1.001
4,mlp.up_proj,2.24941082,0.01000,1.022
4,mlp.gate_proj,3.57545319,0.01000,1.021
4,mlp.down_proj,0.10124407,0.01250,8.207
5,self_attn.k_proj,0.03883768,0.01000,0.988
5,self_attn.v_proj,0.01303059,0.01000,0.984
5,self_attn.q_proj,0.17173260,0.01000,1.006
5,self_attn.o_proj,0.00131935,0.01000,0.999
5,mlp.up_proj,3.46055603,0.01000,1.022
5,mlp.gate_proj,4.57221298,0.01000,1.016
5,mlp.down_proj,0.00324235,0.01000,6.746
6,self_attn.k_proj,0.02526921,0.01000,0.996
6,self_attn.v_proj,0.01024575,0.01000,0.987
6,self_attn.q_proj,0.11551857,0.01000,1.007
6,self_attn.o_proj,0.00209021,0.01000,1.001
6,mlp.up_proj,0.80829830,0.01000,1.019
6,mlp.gate_proj,1.22725925,0.01000,1.020
6,mlp.down_proj,0.00968332,0.01000,6.740
7,self_attn.k_proj,0.02582688,0.01000,0.988
7,self_attn.v_proj,0.01961867,0.01000,0.985
7,self_attn.q_proj,0.13377922,0.01000,1.006
7,self_attn.o_proj,0.00392758,0.01000,0.999
7,mlp.up_proj,0.75072336,0.01000,1.021
7,mlp.gate_proj,0.86212215,0.01000,1.018
7,mlp.down_proj,0.01995223,0.01000,6.750
8,self_attn.k_proj,0.05134981,0.01000,0.992
8,self_attn.v_proj,0.01690738,0.01000,0.987
8,self_attn.q_proj,0.20182838,0.01000,1.006
8,self_attn.o_proj,0.00688519,0.01000,1.005
8,mlp.up_proj,0.93800974,0.01000,1.026
8,mlp.gate_proj,1.00855236,0.01000,1.023
8,mlp.down_proj,0.02311911,0.01000,6.758
9,self_attn.k_proj,0.03937526,0.01000,0.989
9,self_attn.v_proj,0.02913938,0.01000,0.983
9,self_attn.q_proj,0.19917443,0.01000,1.008
9,self_attn.o_proj,0.01041439,0.01000,1.000
9,mlp.up_proj,1.70104084,0.01000,1.022
9,mlp.gate_proj,2.93759079,0.01000,1.019
9,mlp.down_proj,0.01646033,0.01000,6.752
10,self_attn.k_proj,0.03967654,0.01000,0.989
10,self_attn.v_proj,0.01861299,0.01000,0.985
10,self_attn.q_proj,0.18400557,0.01000,1.010
10,self_attn.o_proj,0.00589501,0.01000,1.010
10,mlp.up_proj,0.98707781,0.01000,1.019
10,mlp.gate_proj,1.19088898,0.01000,1.014
10,mlp.down_proj,0.02149785,0.01000,6.753
11,self_attn.k_proj,0.05090361,0.01000,1.000
11,self_attn.v_proj,0.01593005,0.01000,0.993
11,self_attn.q_proj,0.19677665,0.01000,1.021
11,self_attn.o_proj,0.00978884,0.01000,1.016
11,mlp.up_proj,0.93029280,0.01000,1.032
11,mlp.gate_proj,1.02107821,0.01000,1.030
11,mlp.down_proj,0.02074635,0.01000,6.805
12,self_attn.k_proj,0.05454473,0.01000,0.999
12,self_attn.v_proj,0.02165007,0.01000,0.994
12,self_attn.q_proj,0.21794810,0.01000,1.022
12,self_attn.o_proj,0.01120252,0.01000,1.015
12,mlp.up_proj,0.95251245,0.01000,1.036
12,mlp.gate_proj,0.98560581,0.01000,1.027
12,mlp.down_proj,0.02144924,0.01000,6.799
13,self_attn.k_proj,0.04950626,0.01000,0.998
13,self_attn.v_proj,0.02763904,0.01000,0.994
13,self_attn.q_proj,0.23090868,0.01000,1.021
13,self_attn.o_proj,0.01685601,0.01000,1.012
13,mlp.up_proj,0.91604786,0.01000,1.033
13,mlp.gate_proj,1.03953857,0.01000,1.026
13,mlp.down_proj,0.01890075,0.01000,6.808
14,self_attn.k_proj,0.06788545,0.01000,0.999
14,self_attn.v_proj,0.02426277,0.01000,0.995
14,self_attn.q_proj,0.30167136,0.01000,1.021
14,self_attn.o_proj,0.01704209,0.01000,1.007
14,mlp.up_proj,0.97158155,0.01000,1.032
14,mlp.gate_proj,1.04032497,0.01000,1.026
14,mlp.down_proj,0.01923548,0.01000,6.794
15,self_attn.k_proj,0.06322566,0.01000,0.997
15,self_attn.v_proj,0.02059803,0.01000,1.000
15,self_attn.q_proj,0.24423466,0.01000,1.025
15,self_attn.o_proj,0.01134082,0.01000,1.015
15,mlp.up_proj,0.86951542,0.01000,1.038
15,mlp.gate_proj,0.89075184,0.01000,1.032
15,mlp.down_proj,0.01934366,0.01000,6.813
16,self_attn.k_proj,0.05464399,0.01000,1.002
16,self_attn.v_proj,0.02613713,0.01000,1.001
16,self_attn.q_proj,0.23992593,0.01000,1.025
16,self_attn.o_proj,0.02014990,0.01000,1.013
16,mlp.up_proj,0.90349989,0.01000,1.037
16,mlp.gate_proj,0.92065506,0.01000,1.036
16,mlp.down_proj,0.01899366,0.01000,6.797
17,self_attn.k_proj,0.05745988,0.01000,1.001
17,self_attn.v_proj,0.03283790,0.01000,0.997
17,self_attn.q_proj,0.28053503,0.01000,1.019
17,self_attn.o_proj,0.01373601,0.01000,1.011
17,mlp.up_proj,1.08258495,0.01000,1.031
17,mlp.gate_proj,1.07158165,0.01000,1.028
17,mlp.down_proj,0.02532004,0.01000,6.789
18,self_attn.k_proj,0.04298550,0.01000,1.001
18,self_attn.v_proj,0.03532872,0.01000,1.000
18,self_attn.q_proj,0.22009776,0.01000,1.022
18,self_attn.o_proj,0.02198225,0.01000,1.017
18,mlp.up_proj,1.15358105,0.01000,1.032
18,mlp.gate_proj,1.12741137,0.01000,1.029
18,mlp.down_proj,0.02706119,0.01000,6.798
19,self_attn.k_proj,0.04608336,0.01000,1.003
19,self_attn.v_proj,0.04248249,0.01000,1.003
19,self_attn.q_proj,0.27048311,0.01000,1.022
19,self_attn.o_proj,0.02985711,0.01000,1.013
19,mlp.up_proj,1.30711699,0.01000,1.040
19,mlp.gate_proj,1.34808874,0.01000,1.035
19,mlp.down_proj,0.03198723,0.01000,6.801
20,self_attn.k_proj,0.05036389,0.01000,1.002
20,self_attn.v_proj,0.04690300,0.01000,1.005
20,self_attn.q_proj,0.26944330,0.01000,1.025
20,self_attn.o_proj,0.01508863,0.01000,1.012
20,mlp.up_proj,1.60872002,0.01000,1.033
20,mlp.gate_proj,1.62411957,0.01000,1.028
20,mlp.down_proj,0.05501012,0.01000,6.793
21,self_attn.k_proj,0.05348732,0.01000,1.006
21,self_attn.v_proj,0.07228367,0.01000,0.999
21,self_attn.q_proj,0.31927242,0.01000,1.020
21,self_attn.o_proj,0.04879863,0.01000,1.014
21,mlp.up_proj,2.11614609,0.01000,1.032
21,mlp.gate_proj,2.26482544,0.01000,1.031
21,mlp.down_proj,0.07797968,0.01000,6.807
22,self_attn.k_proj,0.07840011,0.01000,1.006
22,self_attn.v_proj,0.12378967,0.01000,1.003
22,self_attn.q_proj,0.47206717,0.01000,1.021
22,self_attn.o_proj,0.02746164,0.01000,1.009
22,mlp.up_proj,2.98232899,0.01000,1.028
22,mlp.gate_proj,3.18851070,0.01000,1.035
22,mlp.down_proj,0.12279578,0.01000,6.815
23,self_attn.k_proj,0.11656542,0.01000,1.008
23,self_attn.v_proj,0.18187238,0.01000,0.999
23,self_attn.q_proj,0.59631906,0.01000,1.011
23,self_attn.o_proj,0.08684207,0.01000,1.003
23,mlp.up_proj,4.30042763,0.01000,1.027
23,mlp.gate_proj,4.74122772,0.01000,1.032
23,mlp.down_proj,0.15644772,0.01000,6.780
24,self_attn.k_proj,0.08580490,0.01000,1.016
24,self_attn.v_proj,0.17929344,0.01000,0.994
24,self_attn.q_proj,0.53899407,0.01000,1.011
24,self_attn.o_proj,0.06268171,0.01000,1.006
24,mlp.up_proj,5.05830460,0.01000,1.034
24,mlp.gate_proj,5.07611618,0.01000,1.038
24,mlp.down_proj,0.20694437,0.01000,6.785
25,self_attn.k_proj,0.10329957,0.01000,1.003
25,self_attn.v_proj,0.32539802,0.01000,1.002
25,self_attn.q_proj,0.63915033,0.01000,1.020
25,self_attn.o_proj,0.08432423,0.01000,1.018
25,mlp.up_proj,6.63615265,0.01000,1.036
25,mlp.gate_proj,6.30570679,0.01000,1.036
25,mlp.down_proj,0.31110430,0.01000,6.795
26,self_attn.k_proj,0.15026597,0.01000,1.006
26,self_attn.v_proj,0.76809883,0.01000,1.003
26,self_attn.q_proj,0.97067184,0.01000,1.023
26,self_attn.o_proj,0.13277307,0.01000,1.019
26,mlp.up_proj,6.72053528,0.01000,1.035
26,mlp.gate_proj,6.24930115,0.01000,1.031
26,mlp.down_proj,0.00063611,0.01250,8.256
27,self_attn.k_proj,0.20015345,0.01000,1.003
27,self_attn.v_proj,1.26770134,0.01000,0.997
27,self_attn.q_proj,1.94311104,0.01000,1.017
27,self_attn.o_proj,0.21284146,0.01000,1.013
27,mlp.up_proj,7.55787125,0.01000,1.033
27,mlp.gate_proj,7.68255539,0.01000,1.030
27,mlp.down_proj,1.65506172,0.01000,6.788