| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000000685,0.05000,1.952 | |
| 0,self_attn.v_proj,0.0000000051,0.05000,1.721 | |
| 0,self_attn.q_proj,0.0000003521,0.05000,1.779 | |
| 0,self_attn.o_proj,0.0000000051,0.05000,1.790 | |
| 0,mlp.gate_proj,0.0000002079,0.05000,2.237 | |
| 0,mlp.up_proj,0.0000001977,0.05000,1.960 | |
| 0,mlp.down_proj,0.0000000034,0.05000,10.567 | |
| 1,self_attn.k_proj,0.0000000373,0.05000,1.738 | |
| 1,self_attn.v_proj,0.0000000025,0.05000,1.740 | |
| 1,self_attn.q_proj,0.0000001444,0.05000,1.788 | |
| 1,self_attn.o_proj,0.0000000007,0.05000,1.782 | |
| 1,mlp.gate_proj,0.0000006684,0.05000,1.988 | |
| 1,mlp.up_proj,0.0000006192,0.05000,1.969 | |
| 1,mlp.down_proj,0.0002015895,0.05000,10.579 | |
| 2,self_attn.k_proj,0.0000020729,0.05000,1.724 | |
| 2,self_attn.v_proj,0.0000007911,0.05000,1.714 | |
| 2,self_attn.q_proj,0.0000070333,0.05000,1.775 | |
| 2,self_attn.o_proj,0.0000000117,0.05000,1.795 | |
| 2,mlp.gate_proj,0.0000012298,0.05000,1.968 | |
| 2,mlp.up_proj,0.0000011734,0.05000,1.972 | |
| 2,mlp.down_proj,0.0000000298,0.05000,10.620 | |
| 3,self_attn.k_proj,0.0000015801,0.05000,1.755 | |
| 3,self_attn.v_proj,0.0000006056,0.05000,1.764 | |
| 3,self_attn.q_proj,0.0000047879,0.05000,1.813 | |
| 3,self_attn.o_proj,0.0000000308,0.05000,1.813 | |
| 3,mlp.gate_proj,0.0000019761,0.05000,1.979 | |
| 3,mlp.up_proj,0.0000019347,0.05000,1.974 | |
| 3,mlp.down_proj,0.0000000406,0.05000,10.661 | |
| 4,self_attn.k_proj,0.0000022731,0.05000,1.872 | |
| 4,self_attn.v_proj,0.0000010830,0.05000,1.864 | |
| 4,self_attn.q_proj,0.0000093928,0.05000,1.906 | |
| 4,self_attn.o_proj,0.0000000120,0.05000,1.927 | |
| 4,mlp.gate_proj,0.0000038092,0.05000,2.084 | |
| 4,mlp.up_proj,0.0000037036,0.05000,2.076 | |
| 4,mlp.down_proj,0.0000000750,0.05000,10.953 | |
| 5,self_attn.k_proj,0.0000031021,0.05000,1.733 | |
| 5,self_attn.v_proj,0.0000017217,0.05000,1.725 | |
| 5,self_attn.q_proj,0.0000123386,0.05000,1.788 | |
| 5,self_attn.o_proj,0.0000000084,0.05000,1.795 | |
| 5,mlp.gate_proj,0.0000062782,0.05000,1.972 | |
| 5,mlp.up_proj,0.0000060347,0.05000,1.947 | |
| 5,mlp.down_proj,0.0000001456,0.05000,10.600 | |
| 6,self_attn.k_proj,0.0000020967,0.05000,1.728 | |
| 6,self_attn.v_proj,0.0000010817,0.05000,1.713 | |
| 6,self_attn.q_proj,0.0000080667,0.05000,1.803 | |
| 6,self_attn.o_proj,0.0000000132,0.05000,1.806 | |
| 6,mlp.gate_proj,0.0000083323,0.05000,1.982 | |
| 6,mlp.up_proj,0.0000080155,0.05000,1.969 | |
| 6,mlp.down_proj,0.0000002012,0.05000,10.563 | |
| 7,self_attn.k_proj,0.0000029421,0.05000,1.741 | |
| 7,self_attn.v_proj,0.0000014289,0.05000,1.724 | |
| 7,self_attn.q_proj,0.0000117084,0.05000,1.821 | |
| 7,self_attn.o_proj,0.0000000213,0.05000,1.799 | |
| 7,mlp.gate_proj,0.0000104807,0.05000,1.985 | |
| 7,mlp.up_proj,0.0000101542,0.05000,1.986 | |
| 7,mlp.down_proj,0.0000002535,0.05000,10.585 | |
| 8,self_attn.k_proj,0.0000027552,0.05000,1.744 | |
| 8,self_attn.v_proj,0.0000014088,0.05000,1.738 | |
| 8,self_attn.q_proj,0.0000106035,0.05000,1.794 | |
| 8,self_attn.o_proj,0.0000000926,0.05000,1.805 | |
| 8,mlp.gate_proj,0.0000121578,0.05000,1.984 | |
| 8,mlp.up_proj,0.0000115947,0.05000,1.978 | |
| 8,mlp.down_proj,0.0000003185,0.05000,10.654 | |
| 9,self_attn.k_proj,0.0000073975,0.05000,1.814 | |
| 9,self_attn.v_proj,0.0000041334,0.05000,1.730 | |
| 9,self_attn.q_proj,0.0000333733,0.05000,1.799 | |
| 9,self_attn.o_proj,0.0000001372,0.05000,1.803 | |
| 9,mlp.gate_proj,0.0000130155,0.05000,1.955 | |
| 9,mlp.up_proj,0.0000125228,0.05000,1.950 | |
| 9,mlp.down_proj,0.0000003395,0.05000,10.714 | |
| 10,self_attn.k_proj,0.0000043694,0.05000,1.737 | |
| 10,self_attn.v_proj,0.0000022361,0.05000,1.723 | |
| 10,self_attn.q_proj,0.0000186031,0.05000,1.816 | |
| 10,self_attn.o_proj,0.0000001746,0.05000,1.795 | |
| 10,mlp.gate_proj,0.0000156931,0.05000,1.980 | |
| 10,mlp.up_proj,0.0000150417,0.05000,1.966 | |
| 10,mlp.down_proj,0.0000004690,0.05000,10.710 | |
| 11,self_attn.k_proj,0.0000051370,0.05000,1.747 | |
| 11,self_attn.v_proj,0.0000023946,0.05000,1.736 | |
| 11,self_attn.q_proj,0.0000224542,0.05000,1.796 | |
| 11,self_attn.o_proj,0.0000001991,0.05000,1.796 | |
| 11,mlp.gate_proj,0.0000179378,0.05000,1.990 | |
| 11,mlp.up_proj,0.0000170724,0.05000,1.969 | |
| 11,mlp.down_proj,0.0000006015,0.05000,10.676 | |
| 12,self_attn.k_proj,0.0000068544,0.05000,1.859 | |
| 12,self_attn.v_proj,0.0000036612,0.05000,1.839 | |
| 12,self_attn.q_proj,0.0000317736,0.05000,1.908 | |
| 12,self_attn.o_proj,0.0000003027,0.05000,1.918 | |
| 12,mlp.gate_proj,0.0000199806,0.05000,2.102 | |
| 12,mlp.up_proj,0.0000191298,0.05000,2.082 | |
| 12,mlp.down_proj,0.0000007129,0.05000,11.001 | |
| 13,self_attn.k_proj,0.0000063864,0.05000,1.730 | |
| 13,self_attn.v_proj,0.0000034330,0.05000,1.719 | |
| 13,self_attn.q_proj,0.0000289530,0.05000,1.980 | |
| 13,self_attn.o_proj,0.0000002358,0.05000,1.790 | |
| 13,mlp.gate_proj,0.0000228015,0.05000,2.018 | |
| 13,mlp.up_proj,0.0000218623,0.05000,1.950 | |
| 13,mlp.down_proj,0.0000009059,0.05000,10.562 | |
| 14,self_attn.k_proj,0.0000061387,0.05000,1.805 | |
| 14,self_attn.v_proj,0.0000032689,0.05000,1.739 | |
| 14,self_attn.q_proj,0.0000278935,0.05000,2.213 | |
| 14,self_attn.o_proj,0.0000004098,0.05000,1.805 | |
| 14,mlp.gate_proj,0.0000234183,0.05000,2.002 | |
| 14,mlp.up_proj,0.0000224868,0.05000,1.981 | |
| 14,mlp.down_proj,0.0000009782,0.05000,10.644 | |
| 15,self_attn.k_proj,0.0000076575,0.05000,1.760 | |
| 15,self_attn.v_proj,0.0000041983,0.05000,1.746 | |
| 15,self_attn.q_proj,0.0000377521,0.05000,1.809 | |
| 15,self_attn.o_proj,0.0000003109,0.05000,1.816 | |
| 15,mlp.gate_proj,0.0000293268,0.05000,2.150 | |
| 15,mlp.up_proj,0.0000280428,0.05000,1.963 | |
| 15,mlp.down_proj,0.0000012089,0.05000,10.600 | |
| 16,self_attn.k_proj,0.0000071514,0.05000,1.771 | |
| 16,self_attn.v_proj,0.0000036904,0.05000,1.765 | |
| 16,self_attn.q_proj,0.0000334941,0.05000,1.815 | |
| 16,self_attn.o_proj,0.0000003754,0.05000,1.823 | |
| 16,mlp.gate_proj,0.0000318242,0.05000,2.024 | |
| 16,mlp.up_proj,0.0000304060,0.05000,2.003 | |
| 16,mlp.down_proj,0.0000014082,0.05000,10.840 | |
| 17,self_attn.k_proj,0.0000058214,0.05000,1.763 | |
| 17,self_attn.v_proj,0.0000035011,0.05000,1.745 | |
| 17,self_attn.q_proj,0.0000266938,0.05000,1.815 | |
| 17,self_attn.o_proj,0.0000004904,0.05000,1.805 | |
| 17,mlp.gate_proj,0.0000305605,0.05000,2.189 | |
| 17,mlp.up_proj,0.0000294420,0.05000,1.994 | |
| 17,mlp.down_proj,0.0000015261,0.05000,10.648 | |
| 18,self_attn.k_proj,0.0000113896,0.05000,1.742 | |
| 18,self_attn.v_proj,0.0000064052,0.05000,1.727 | |
| 18,self_attn.q_proj,0.0000516542,0.05000,1.795 | |
| 18,self_attn.o_proj,0.0000004344,0.05000,1.796 | |
| 18,mlp.gate_proj,0.0000367808,0.05000,1.973 | |
| 18,mlp.up_proj,0.0000351525,0.05000,1.962 | |
| 18,mlp.down_proj,0.0000018911,0.05000,10.552 | |
| 19,self_attn.k_proj,0.0000147619,0.05000,1.741 | |
| 19,self_attn.v_proj,0.0000090224,0.05000,1.746 | |
| 19,self_attn.q_proj,0.0000708490,0.05000,1.792 | |
| 19,self_attn.o_proj,0.0000004645,0.05000,1.792 | |
| 19,mlp.gate_proj,0.0000423705,0.05000,1.967 | |
| 19,mlp.up_proj,0.0000406029,0.05000,1.968 | |
| 19,mlp.down_proj,0.0000027029,0.05000,10.781 | |
| 20,self_attn.k_proj,0.0000055276,0.05000,1.750 | |
| 20,self_attn.v_proj,0.0000033355,0.05000,1.743 | |
| 20,self_attn.q_proj,0.0000273500,0.05000,1.793 | |
| 20,self_attn.o_proj,0.0000006263,0.05000,1.793 | |
| 20,mlp.gate_proj,0.0000512864,0.05000,2.252 | |
| 20,mlp.up_proj,0.0000486326,0.05000,1.969 | |
| 20,mlp.down_proj,0.0000035893,0.05000,10.766 | |
| 21,self_attn.k_proj,0.0000045427,0.05000,1.768 | |
| 21,self_attn.v_proj,0.0000029989,0.05000,1.780 | |
| 21,self_attn.q_proj,0.0000227807,0.05000,1.806 | |
| 21,self_attn.o_proj,0.0000011423,0.05000,1.793 | |
| 21,mlp.gate_proj,0.0000463502,0.05000,2.002 | |
| 21,mlp.up_proj,0.0000443138,0.05000,1.962 | |
| 21,mlp.down_proj,0.0000035231,0.05000,10.620 | |
| 22,self_attn.k_proj,0.0000118840,0.05000,1.769 | |
| 22,self_attn.v_proj,0.0000075208,0.05000,1.737 | |
| 22,self_attn.q_proj,0.0000649774,0.05000,1.802 | |
| 22,self_attn.o_proj,0.0000013580,0.05000,1.791 | |
| 22,mlp.gate_proj,0.0000637017,0.05000,2.294 | |
| 22,mlp.up_proj,0.0000610995,0.05000,1.964 | |
| 22,mlp.down_proj,0.0000066878,0.05000,10.608 | |
| 23,self_attn.k_proj,0.0000096768,0.05000,1.758 | |
| 23,self_attn.v_proj,0.0000066151,0.05000,1.746 | |
| 23,self_attn.q_proj,0.0000553509,0.05000,1.801 | |
| 23,self_attn.o_proj,0.0000017100,0.05000,1.799 | |
| 23,mlp.gate_proj,0.0000711954,0.05000,2.026 | |
| 23,mlp.up_proj,0.0000675318,0.05000,1.981 | |
| 23,mlp.down_proj,0.0000065035,0.05000,10.602 | |
| 24,self_attn.k_proj,0.0000083006,0.05000,1.753 | |
| 24,self_attn.v_proj,0.0000067867,0.05000,1.741 | |
| 24,self_attn.q_proj,0.0000467073,0.05000,1.793 | |
| 24,self_attn.o_proj,0.0000016390,0.05000,1.797 | |
| 24,mlp.gate_proj,0.0000832089,0.05000,1.972 | |
| 24,mlp.up_proj,0.0000782947,0.05000,1.960 | |
| 24,mlp.down_proj,0.0000072162,0.05000,10.594 | |
| 25,self_attn.k_proj,0.0000148592,0.05000,1.930 | |
| 25,self_attn.v_proj,0.0000096430,0.05000,1.742 | |
| 25,self_attn.q_proj,0.0000845463,0.05000,1.797 | |
| 25,self_attn.o_proj,0.0000019787,0.05000,1.794 | |
| 25,mlp.gate_proj,0.0000984830,0.05000,1.975 | |
| 25,mlp.up_proj,0.0000933006,0.05000,1.967 | |
| 25,mlp.down_proj,0.0000084473,0.05000,10.587 | |
| 26,self_attn.k_proj,0.0000107672,0.05000,1.781 | |
| 26,self_attn.v_proj,0.0000072195,0.05000,1.763 | |
| 26,self_attn.q_proj,0.0000593120,0.05000,1.823 | |
| 26,self_attn.o_proj,0.0000023962,0.05000,1.816 | |
| 26,mlp.gate_proj,0.0001110225,0.05000,1.998 | |
| 26,mlp.up_proj,0.0001054887,0.05000,1.983 | |
| 26,mlp.down_proj,0.0000088992,0.05000,10.699 | |
| 27,self_attn.k_proj,0.0000106991,0.05000,1.944 | |
| 27,self_attn.v_proj,0.0000075662,0.05000,1.731 | |
| 27,self_attn.q_proj,0.0000575445,0.05000,1.781 | |
| 27,self_attn.o_proj,0.0000020078,0.05000,1.789 | |
| 27,mlp.gate_proj,0.0001217312,0.05000,1.969 | |
| 27,mlp.up_proj,0.0001160810,0.05000,1.964 | |
| 27,mlp.down_proj,0.0000096916,0.05000,10.565 | |
| 28,self_attn.k_proj,0.0000104979,0.05000,1.767 | |
| 28,self_attn.v_proj,0.0000081629,0.05000,1.760 | |
| 28,self_attn.q_proj,0.0000589817,0.05000,1.814 | |
| 28,self_attn.o_proj,0.0000016211,0.05000,1.817 | |
| 28,mlp.gate_proj,0.0001300697,0.05000,2.004 | |
| 28,mlp.up_proj,0.0001248194,0.05000,1.968 | |
| 28,mlp.down_proj,0.0000111233,0.05000,10.678 | |
| 29,self_attn.k_proj,0.0000137042,0.05000,1.752 | |
| 29,self_attn.v_proj,0.0000089406,0.05000,1.733 | |
| 29,self_attn.q_proj,0.0000729328,0.05000,1.784 | |
| 29,self_attn.o_proj,0.0000026417,0.05000,1.797 | |
| 29,mlp.gate_proj,0.0001383661,0.05000,1.988 | |
| 29,mlp.up_proj,0.0001325025,0.05000,1.966 | |
| 29,mlp.down_proj,0.0000118384,0.05000,11.022 | |
| 30,self_attn.k_proj,0.0000135094,0.05000,1.777 | |
| 30,self_attn.v_proj,0.0000106211,0.05000,1.751 | |
| 30,self_attn.q_proj,0.0000781156,0.05000,1.796 | |
| 30,self_attn.o_proj,0.0000030378,0.05000,1.798 | |
| 30,mlp.gate_proj,0.0001510154,0.05000,1.980 | |
| 30,mlp.up_proj,0.0001430569,0.05000,1.968 | |
| 30,mlp.down_proj,0.0000125046,0.05000,10.932 | |
| 31,self_attn.k_proj,0.0000150631,0.05000,1.762 | |
| 31,self_attn.v_proj,0.0000115141,0.05000,1.744 | |
| 31,self_attn.q_proj,0.0000834578,0.05000,1.799 | |
| 31,self_attn.o_proj,0.0000020846,0.05000,1.790 | |
| 31,mlp.gate_proj,0.0001636284,0.05000,2.262 | |
| 31,mlp.up_proj,0.0001546849,0.05000,1.962 | |
| 31,mlp.down_proj,0.0000131806,0.05000,10.579 | |
| 32,self_attn.k_proj,0.0000166102,0.05000,1.781 | |
| 32,self_attn.v_proj,0.0000128024,0.05000,1.740 | |
| 32,self_attn.q_proj,0.0000919194,0.05000,1.790 | |
| 32,self_attn.o_proj,0.0000023728,0.05000,1.815 | |
| 32,mlp.gate_proj,0.0001712901,0.05000,1.978 | |
| 32,mlp.up_proj,0.0001622502,0.05000,1.971 | |
| 32,mlp.down_proj,0.0000140184,0.05000,10.771 | |
| 33,self_attn.k_proj,0.0000155397,0.05000,1.807 | |
| 33,self_attn.v_proj,0.0000141580,0.05000,1.770 | |
| 33,self_attn.q_proj,0.0000830037,0.05000,1.835 | |
| 33,self_attn.o_proj,0.0000017610,0.05000,1.820 | |
| 33,mlp.gate_proj,0.0001827080,0.05000,2.015 | |
| 33,mlp.up_proj,0.0001707335,0.05000,1.991 | |
| 33,mlp.down_proj,0.0000144502,0.05000,10.621 | |
| 34,self_attn.k_proj,0.0000175148,0.05000,3.051 | |
| 34,self_attn.v_proj,0.0000159380,0.05000,1.756 | |
| 34,self_attn.q_proj,0.0000969024,0.05000,1.819 | |
| 34,self_attn.o_proj,0.0000012757,0.05000,1.814 | |
| 34,mlp.gate_proj,0.0001907635,0.05000,1.991 | |
| 34,mlp.up_proj,0.0001778772,0.05000,1.972 | |
| 34,mlp.down_proj,0.0000154265,0.05000,10.691 | |
| 35,self_attn.k_proj,0.0000191118,0.05000,1.755 | |
| 35,self_attn.v_proj,0.0000179529,0.05000,1.751 | |
| 35,self_attn.q_proj,0.0001059562,0.05000,1.857 | |
| 35,self_attn.o_proj,0.0000010396,0.05000,1.815 | |
| 35,mlp.gate_proj,0.0001951154,0.05000,2.000 | |
| 35,mlp.up_proj,0.0001831631,0.05000,1.992 | |
| 35,mlp.down_proj,0.0000158026,0.05000,10.654 | |
| 36,self_attn.k_proj,0.0000201484,0.05000,1.778 | |
| 36,self_attn.v_proj,0.0000189599,0.05000,1.774 | |
| 36,self_attn.q_proj,0.0001111809,0.05000,1.842 | |
| 36,self_attn.o_proj,0.0000018594,0.05000,1.806 | |
| 36,mlp.gate_proj,0.0001979247,0.05000,1.987 | |
| 36,mlp.up_proj,0.0001868471,0.05000,2.024 | |
| 36,mlp.down_proj,0.0000156611,0.05000,10.717 | |
| 37,self_attn.k_proj,0.0000191277,0.05000,2.143 | |
| 37,self_attn.v_proj,0.0000170317,0.05000,1.762 | |
| 37,self_attn.q_proj,0.0001037516,0.05000,1.824 | |
| 37,self_attn.o_proj,0.0000016494,0.05000,1.918 | |
| 37,mlp.gate_proj,0.0002023499,0.05000,2.012 | |
| 37,mlp.up_proj,0.0001926919,0.05000,1.967 | |
| 37,mlp.down_proj,0.0000165328,0.05000,10.620 | |
| 38,self_attn.k_proj,0.0000190743,0.05000,1.760 | |
| 38,self_attn.v_proj,0.0000157472,0.05000,1.751 | |
| 38,self_attn.q_proj,0.0001001458,0.05000,1.804 | |
| 38,self_attn.o_proj,0.0000027518,0.05000,1.816 | |
| 38,mlp.gate_proj,0.0002092387,0.05000,2.005 | |
| 38,mlp.up_proj,0.0001991309,0.05000,1.979 | |
| 38,mlp.down_proj,0.0000174658,0.05000,10.616 | |
| 39,self_attn.k_proj,0.0000183438,0.05000,1.797 | |
| 39,self_attn.v_proj,0.0000157707,0.05000,1.786 | |
| 39,self_attn.q_proj,0.0000962149,0.05000,1.829 | |
| 39,self_attn.o_proj,0.0000025272,0.05000,1.819 | |
| 39,mlp.gate_proj,0.0002148854,0.05000,2.003 | |
| 39,mlp.up_proj,0.0002056378,0.05000,1.984 | |
| 39,mlp.down_proj,0.0000188615,0.05000,10.656 | |
| 40,self_attn.k_proj,0.0000182748,0.05000,1.776 | |
| 40,self_attn.v_proj,0.0000128602,0.05000,1.801 | |
| 40,self_attn.q_proj,0.0000945882,0.05000,1.837 | |
| 40,self_attn.o_proj,0.0000040090,0.05000,1.838 | |
| 40,mlp.gate_proj,0.0002224625,0.05000,1.998 | |
| 40,mlp.up_proj,0.0002146541,0.05000,2.031 | |
| 40,mlp.down_proj,0.0000212490,0.05000,10.668 | |
| 41,self_attn.k_proj,0.0000163700,0.05000,1.771 | |
| 41,self_attn.v_proj,0.0000122546,0.05000,1.760 | |
| 41,self_attn.q_proj,0.0000833327,0.05000,1.834 | |
| 41,self_attn.o_proj,0.0000048864,0.05000,1.838 | |
| 41,mlp.gate_proj,0.0002355262,0.05000,1.998 | |
| 41,mlp.up_proj,0.0002269599,0.05000,1.979 | |
| 41,mlp.down_proj,0.0000229579,0.05000,10.677 | |
| 42,self_attn.k_proj,0.0000204834,0.05000,1.763 | |
| 42,self_attn.v_proj,0.0000159663,0.05000,1.760 | |
| 42,self_attn.q_proj,0.0001116346,0.05000,1.817 | |
| 42,self_attn.o_proj,0.0000038089,0.05000,1.806 | |
| 42,mlp.gate_proj,0.0002455023,0.05000,2.074 | |
| 42,mlp.up_proj,0.0002384295,0.05000,1.989 | |
| 42,mlp.down_proj,0.0000260395,0.05000,10.683 | |
| 43,self_attn.k_proj,0.0000201844,0.05000,1.780 | |
| 43,self_attn.v_proj,0.0000141727,0.05000,1.764 | |
| 43,self_attn.q_proj,0.0001068181,0.05000,1.814 | |
| 43,self_attn.o_proj,0.0000052884,0.05000,1.820 | |
| 43,mlp.gate_proj,0.0002542797,0.05000,1.992 | |
| 43,mlp.up_proj,0.0002492644,0.05000,1.983 | |
| 43,mlp.down_proj,0.0000290737,0.05000,10.705 | |
| 44,self_attn.k_proj,0.0000191750,0.05000,1.750 | |
| 44,self_attn.v_proj,0.0000128655,0.05000,1.774 | |
| 44,self_attn.q_proj,0.0001060084,0.05000,1.799 | |
| 44,self_attn.o_proj,0.0000067395,0.05000,1.800 | |
| 44,mlp.gate_proj,0.0002601013,0.05000,1.982 | |
| 44,mlp.up_proj,0.0002597747,0.05000,1.974 | |
| 44,mlp.down_proj,0.0000352207,0.05000,10.593 | |
| 45,self_attn.k_proj,0.0000203800,0.05000,1.776 | |
| 45,self_attn.v_proj,0.0000116344,0.05000,1.754 | |
| 45,self_attn.q_proj,0.0001127626,0.05000,1.810 | |
| 45,self_attn.o_proj,0.0000093858,0.05000,1.806 | |
| 45,mlp.gate_proj,0.0002680701,0.05000,1.988 | |
| 45,mlp.up_proj,0.0002698083,0.05000,1.975 | |
| 45,mlp.down_proj,0.0000560786,0.05000,10.791 | |
| 46,self_attn.k_proj,0.0000223115,0.05000,1.746 | |
| 46,self_attn.v_proj,0.0000130194,0.05000,1.736 | |
| 46,self_attn.q_proj,0.0001210351,0.05000,1.809 | |
| 46,self_attn.o_proj,0.0000144393,0.05000,1.794 | |
| 46,mlp.gate_proj,0.0002725730,0.05000,1.981 | |
| 46,mlp.up_proj,0.0002767919,0.05000,1.957 | |
| 46,mlp.down_proj,0.0000390935,0.05000,10.800 | |
| 47,self_attn.k_proj,0.0000220920,0.05000,1.766 | |
| 47,self_attn.v_proj,0.0000137250,0.05000,1.765 | |
| 47,self_attn.q_proj,0.0001228667,0.05000,2.014 | |
| 47,self_attn.o_proj,0.0000139756,0.05000,1.816 | |
| 47,mlp.gate_proj,0.0002729540,0.05000,2.008 | |
| 47,mlp.up_proj,0.0002807646,0.05000,1.981 | |
| 47,mlp.down_proj,0.0000435434,0.05000,10.649 | |
| 48,self_attn.k_proj,0.0000213162,0.05000,1.763 | |
| 48,self_attn.v_proj,0.0000155181,0.05000,1.758 | |
| 48,self_attn.q_proj,0.0001272095,0.05000,1.812 | |
| 48,self_attn.o_proj,0.0000127778,0.05000,1.836 | |
| 48,mlp.gate_proj,0.0002877861,0.05000,2.007 | |
| 48,mlp.up_proj,0.0002972881,0.05000,1.988 | |
| 48,mlp.down_proj,0.0000485562,0.05000,10.649 | |
| 49,self_attn.k_proj,0.0000211959,0.05000,1.757 | |
| 49,self_attn.v_proj,0.0000150000,0.05000,1.748 | |
| 49,self_attn.q_proj,0.0001207883,0.05000,1.816 | |
| 49,self_attn.o_proj,0.0000144471,0.05000,1.810 | |
| 49,mlp.gate_proj,0.0002878208,0.05000,2.077 | |
| 49,mlp.up_proj,0.0003003240,0.05000,1.973 | |
| 49,mlp.down_proj,0.0000530659,0.05000,10.765 | |
| 50,self_attn.k_proj,0.0000258553,0.05000,1.758 | |
| 50,self_attn.v_proj,0.0000171321,0.05000,1.749 | |
| 50,self_attn.q_proj,0.0001526195,0.05000,1.809 | |
| 50,self_attn.o_proj,0.0000200374,0.05000,1.810 | |
| 50,mlp.gate_proj,0.0002848091,0.05000,2.031 | |
| 50,mlp.up_proj,0.0002997550,0.05000,2.054 | |
| 50,mlp.down_proj,0.0000592731,0.05000,10.671 | |
| 51,self_attn.k_proj,0.0000231560,0.05000,1.778 | |
| 51,self_attn.v_proj,0.0000151993,0.05000,1.752 | |
| 51,self_attn.q_proj,0.0001321706,0.05000,1.818 | |
| 51,self_attn.o_proj,0.0000205501,0.05000,1.809 | |
| 51,mlp.gate_proj,0.0002997619,0.05000,2.003 | |
| 51,mlp.up_proj,0.0003137411,0.05000,1.984 | |
| 51,mlp.down_proj,0.0000643393,0.05000,11.131 | |
| 52,self_attn.k_proj,0.0000203590,0.05000,1.745 | |
| 52,self_attn.v_proj,0.0000186799,0.05000,1.742 | |
| 52,self_attn.q_proj,0.0001251833,0.05000,1.810 | |
| 52,self_attn.o_proj,0.0000231322,0.05000,1.844 | |
| 52,mlp.gate_proj,0.0003448580,0.05000,1.992 | |
| 52,mlp.up_proj,0.0003562837,0.05000,1.984 | |
| 52,mlp.down_proj,0.0000686877,0.05000,11.025 | |
| 53,self_attn.k_proj,0.0000233242,0.05000,1.752 | |
| 53,self_attn.v_proj,0.0000200947,0.05000,1.762 | |
| 53,self_attn.q_proj,0.0001410289,0.05000,1.855 | |
| 53,self_attn.o_proj,0.0000270083,0.05000,1.809 | |
| 53,mlp.gate_proj,0.0003695233,0.05000,2.113 | |
| 53,mlp.up_proj,0.0003783724,0.05000,1.978 | |
| 53,mlp.down_proj,0.0000720811,0.05000,10.649 | |
| 54,self_attn.k_proj,0.0000225596,0.05000,1.765 | |
| 54,self_attn.v_proj,0.0000258560,0.05000,1.752 | |
| 54,self_attn.q_proj,0.0001495487,0.05000,2.181 | |
| 54,self_attn.o_proj,0.0000239377,0.05000,1.814 | |
| 54,mlp.gate_proj,0.0003636169,0.05000,1.974 | |
| 54,mlp.up_proj,0.0003744466,0.05000,1.987 | |
| 54,mlp.down_proj,0.0000797681,0.05000,10.955 | |
| 55,self_attn.k_proj,0.0000218617,0.05000,1.764 | |
| 55,self_attn.v_proj,0.0000253199,0.05000,1.758 | |
| 55,self_attn.q_proj,0.0001466854,0.05000,1.822 | |
| 55,self_attn.o_proj,0.0000282526,0.05000,1.815 | |
| 55,mlp.gate_proj,0.0003757199,0.05000,1.990 | |
| 55,mlp.up_proj,0.0003881287,0.05000,1.987 | |
| 55,mlp.down_proj,0.0000911115,0.05000,10.635 | |
| 56,self_attn.k_proj,0.0000223928,0.05000,1.794 | |
| 56,self_attn.v_proj,0.0000218095,0.05000,1.772 | |
| 56,self_attn.q_proj,0.0001375662,0.05000,1.816 | |
| 56,self_attn.o_proj,0.0000379754,0.05000,1.812 | |
| 56,mlp.gate_proj,0.0004133328,0.05000,2.341 | |
| 56,mlp.up_proj,0.0004231848,0.05000,1.989 | |
| 56,mlp.down_proj,0.0001026907,0.05000,10.732 | |
| 57,self_attn.k_proj,0.0000240502,0.05000,1.773 | |
| 57,self_attn.v_proj,0.0000254070,0.05000,1.769 | |
| 57,self_attn.q_proj,0.0001487034,0.05000,1.813 | |
| 57,self_attn.o_proj,0.0000396974,0.05000,1.844 | |
| 57,mlp.gate_proj,0.0004108658,0.05000,2.431 | |
| 57,mlp.up_proj,0.0004240784,0.05000,2.008 | |
| 57,mlp.down_proj,0.0001128101,0.05000,10.571 | |
| 58,self_attn.k_proj,0.0000219804,0.05000,1.833 | |
| 58,self_attn.v_proj,0.0000258982,0.05000,1.745 | |
| 58,self_attn.q_proj,0.0001463768,0.05000,1.808 | |
| 58,self_attn.o_proj,0.0000463313,0.05000,1.809 | |
| 58,mlp.gate_proj,0.0004239820,0.05000,1.996 | |
| 58,mlp.up_proj,0.0004381811,0.05000,1.988 | |
| 58,mlp.down_proj,0.0001411034,0.05000,10.627 | |
| 59,self_attn.k_proj,0.0000221796,0.05000,1.749 | |
| 59,self_attn.v_proj,0.0000271249,0.05000,1.760 | |
| 59,self_attn.q_proj,0.0001451733,0.05000,1.847 | |
| 59,self_attn.o_proj,0.0000497049,0.05000,1.813 | |
| 59,mlp.gate_proj,0.0004518706,0.05000,2.006 | |
| 59,mlp.up_proj,0.0004566152,0.05000,2.009 | |
| 59,mlp.down_proj,0.0001616510,0.05000,10.726 | |
| 60,self_attn.k_proj,0.0000241346,0.05000,1.740 | |
| 60,self_attn.v_proj,0.0000341904,0.05000,1.735 | |
| 60,self_attn.q_proj,0.0001691093,0.05000,1.811 | |
| 60,self_attn.o_proj,0.0000432857,0.05000,1.815 | |
| 60,mlp.gate_proj,0.0005488024,0.05000,1.983 | |
| 60,mlp.up_proj,0.0005428663,0.05000,1.967 | |
| 60,mlp.down_proj,0.0001826035,0.05000,10.607 | |
| 61,self_attn.k_proj,0.0000247619,0.05000,1.780 | |
| 61,self_attn.v_proj,0.0000374423,0.05000,1.778 | |
| 61,self_attn.q_proj,0.0001707510,0.05000,1.828 | |
| 61,self_attn.o_proj,0.0000489282,0.05000,1.796 | |
| 61,mlp.gate_proj,0.0006036149,0.05000,2.043 | |
| 61,mlp.up_proj,0.0005943566,0.05000,1.986 | |
| 61,mlp.down_proj,0.0002096645,0.05000,10.626 | |
| 62,self_attn.k_proj,0.0000260108,0.05000,1.744 | |
| 62,self_attn.v_proj,0.0000357173,0.05000,1.747 | |
| 62,self_attn.q_proj,0.0001779701,0.05000,1.806 | |
| 62,self_attn.o_proj,0.0000560566,0.05000,1.800 | |
| 62,mlp.gate_proj,0.0007026849,0.05000,1.983 | |
| 62,mlp.up_proj,0.0006780243,0.05000,1.958 | |
| 62,mlp.down_proj,0.0002315546,0.05000,10.636 | |
| 63,self_attn.k_proj,0.0000259721,0.05000,1.775 | |
| 63,self_attn.v_proj,0.0000370121,0.05000,1.768 | |
| 63,self_attn.q_proj,0.0001751592,0.05000,1.833 | |
| 63,self_attn.o_proj,0.0000582709,0.05000,1.794 | |
| 63,mlp.gate_proj,0.0007427418,0.05000,2.061 | |
| 63,mlp.up_proj,0.0007230977,0.05000,1.987 | |
| 63,mlp.down_proj,0.0002685315,0.05000,10.627 | |
| 64,self_attn.k_proj,0.0000277544,0.05000,1.773 | |
| 64,self_attn.v_proj,0.0000370765,0.05000,1.817 | |
| 64,self_attn.q_proj,0.0001851113,0.05000,1.824 | |
| 64,self_attn.o_proj,0.0000561820,0.05000,1.813 | |
| 64,mlp.gate_proj,0.0008117926,0.05000,1.997 | |
| 64,mlp.up_proj,0.0007852368,0.05000,1.984 | |
| 64,mlp.down_proj,0.0003075914,0.05000,10.902 | |
| 65,self_attn.k_proj,0.0000285461,0.05000,1.787 | |
| 65,self_attn.v_proj,0.0000393212,0.05000,1.763 | |
| 65,self_attn.q_proj,0.0001911329,0.05000,1.814 | |
| 65,self_attn.o_proj,0.0000612525,0.05000,1.806 | |
| 65,mlp.gate_proj,0.0009011056,0.05000,1.996 | |
| 65,mlp.up_proj,0.0008748247,0.05000,1.984 | |
| 65,mlp.down_proj,0.0003410627,0.05000,10.640 | |
| 66,self_attn.k_proj,0.0000250020,0.05000,1.769 | |
| 66,self_attn.v_proj,0.0000412053,0.05000,1.804 | |
| 66,self_attn.q_proj,0.0001777558,0.05000,1.822 | |
| 66,self_attn.o_proj,0.0000593562,0.05000,1.806 | |
| 66,mlp.gate_proj,0.0010464112,0.05000,1.991 | |
| 66,mlp.up_proj,0.0010015315,0.05000,1.975 | |
| 66,mlp.down_proj,0.0003793334,0.05000,10.629 | |
| 67,self_attn.k_proj,0.0000271901,0.05000,1.769 | |
| 67,self_attn.v_proj,0.0000476565,0.05000,1.783 | |
| 67,self_attn.q_proj,0.0001915081,0.05000,1.825 | |
| 67,self_attn.o_proj,0.0000432816,0.05000,1.820 | |
| 67,mlp.gate_proj,0.0011060469,0.05000,2.151 | |
| 67,mlp.up_proj,0.0010709054,0.05000,1.993 | |
| 67,mlp.down_proj,0.0004122393,0.05000,10.675 | |
| 68,self_attn.k_proj,0.0000280968,0.05000,1.749 | |
| 68,self_attn.v_proj,0.0000545287,0.05000,1.744 | |
| 68,self_attn.q_proj,0.0002037208,0.05000,1.818 | |
| 68,self_attn.o_proj,0.0000551032,0.05000,1.805 | |
| 68,mlp.gate_proj,0.0011910696,0.05000,2.007 | |
| 68,mlp.up_proj,0.0011660263,0.05000,2.002 | |
| 68,mlp.down_proj,0.0004548276,0.05000,10.648 | |
| 69,self_attn.k_proj,0.0000288387,0.05000,1.752 | |
| 69,self_attn.v_proj,0.0000463445,0.05000,1.772 | |
| 69,self_attn.q_proj,0.0001985468,0.05000,1.822 | |
| 69,self_attn.o_proj,0.0000651683,0.05000,1.812 | |
| 69,mlp.gate_proj,0.0012707321,0.05000,2.017 | |
| 69,mlp.up_proj,0.0012687438,0.05000,1.987 | |
| 69,mlp.down_proj,0.0005535664,0.05000,10.638 | |
| 70,self_attn.k_proj,0.0000278806,0.05000,1.833 | |
| 70,self_attn.v_proj,0.0000634856,0.05000,1.766 | |
| 70,self_attn.q_proj,0.0002063552,0.05000,1.824 | |
| 70,self_attn.o_proj,0.0000850229,0.05000,1.822 | |
| 70,mlp.gate_proj,0.0014331741,0.05000,2.091 | |
| 70,mlp.up_proj,0.0014520215,0.05000,1.987 | |
| 70,mlp.down_proj,0.0006782743,0.05000,10.642 | |
| 71,self_attn.k_proj,0.0000291759,0.05000,1.771 | |
| 71,self_attn.v_proj,0.0000665733,0.05000,1.748 | |
| 71,self_attn.q_proj,0.0002151191,0.05000,1.818 | |
| 71,self_attn.o_proj,0.0000977527,0.05000,1.800 | |
| 71,mlp.gate_proj,0.0015705100,0.05000,2.357 | |
| 71,mlp.up_proj,0.0016157514,0.05000,1.970 | |
| 71,mlp.down_proj,0.0008346530,0.05000,10.610 | |
| 72,self_attn.k_proj,0.0000277748,0.05000,1.781 | |
| 72,self_attn.v_proj,0.0000769196,0.05000,1.770 | |
| 72,self_attn.q_proj,0.0002174281,0.05000,1.811 | |
| 72,self_attn.o_proj,0.0000868489,0.05000,1.822 | |
| 72,mlp.gate_proj,0.0017338871,0.05000,2.008 | |
| 72,mlp.up_proj,0.0018062971,0.05000,2.012 | |
| 72,mlp.down_proj,0.0010927289,0.05000,10.713 | |
| 73,self_attn.k_proj,0.0000286837,0.05000,1.855 | |
| 73,self_attn.v_proj,0.0000898291,0.05000,1.765 | |
| 73,self_attn.q_proj,0.0002256701,0.05000,1.823 | |
| 73,self_attn.o_proj,0.0001178069,0.05000,1.812 | |
| 73,mlp.gate_proj,0.0018677687,0.05000,2.000 | |
| 73,mlp.up_proj,0.0019719667,0.05000,1.974 | |
| 73,mlp.down_proj,0.0013667705,0.05000,10.622 | |
| 74,self_attn.k_proj,0.0000291870,0.05000,1.782 | |
| 74,self_attn.v_proj,0.0000854093,0.05000,1.765 | |
| 74,self_attn.q_proj,0.0002426886,0.05000,1.822 | |
| 74,self_attn.o_proj,0.0001362484,0.05000,1.820 | |
| 74,mlp.gate_proj,0.0019655873,0.05000,1.998 | |
| 74,mlp.up_proj,0.0021086635,0.05000,1.984 | |
| 74,mlp.down_proj,0.0018890411,0.05000,10.693 | |
| 75,self_attn.k_proj,0.0000286997,0.05000,1.761 | |
| 75,self_attn.v_proj,0.0001000469,0.05000,1.738 | |
| 75,self_attn.q_proj,0.0002336207,0.05000,1.786 | |
| 75,self_attn.o_proj,0.0001834656,0.05000,1.802 | |
| 75,mlp.gate_proj,0.0021311569,0.05000,1.993 | |
| 75,mlp.up_proj,0.0023135146,0.05000,2.004 | |
| 75,mlp.down_proj,0.0029731325,0.05000,10.627 | |
| 76,self_attn.k_proj,0.0000291649,0.05000,1.759 | |
| 76,self_attn.v_proj,0.0001630616,0.05000,1.747 | |
| 76,self_attn.q_proj,0.0002645282,0.05000,1.796 | |
| 76,self_attn.o_proj,0.0002224826,0.05000,1.891 | |
| 76,mlp.gate_proj,0.0022946957,0.05000,2.193 | |
| 76,mlp.up_proj,0.0025133457,0.05000,1.982 | |
| 76,mlp.down_proj,0.0047117417,0.05000,10.648 | |
| 77,self_attn.k_proj,0.0000274915,0.05000,1.782 | |
| 77,self_attn.v_proj,0.0001038129,0.05000,1.765 | |
| 77,self_attn.q_proj,0.0002454595,0.05000,1.843 | |
| 77,self_attn.o_proj,0.0003246888,0.05000,1.824 | |
| 77,mlp.gate_proj,0.0024383952,0.05000,2.030 | |
| 77,mlp.up_proj,0.0026753585,0.05000,1.995 | |
| 77,mlp.down_proj,0.0054391157,0.05000,10.677 | |
| 78,self_attn.k_proj,0.0000255497,0.05000,1.753 | |
| 78,self_attn.v_proj,0.0001116223,0.05000,1.773 | |
| 78,self_attn.q_proj,0.0002304750,0.05000,1.823 | |
| 78,self_attn.o_proj,0.0003565016,0.05000,1.820 | |
| 78,mlp.gate_proj,0.0022525496,0.05000,1.985 | |
| 78,mlp.up_proj,0.0024347074,0.05000,1.993 | |
| 78,mlp.down_proj,0.0097805633,0.05000,10.660 | |
| 79,self_attn.k_proj,0.0000219384,0.05000,1.772 | |
| 79,self_attn.v_proj,0.0000395143,0.05000,1.750 | |
| 79,self_attn.q_proj,0.0001646463,0.05000,1.812 | |
| 79,self_attn.o_proj,0.0001054719,0.05000,1.787 | |
| 79,mlp.gate_proj,0.0021020814,0.05000,2.001 | |
| 79,mlp.up_proj,0.0022070014,0.05000,2.006 | |
| 79,mlp.down_proj,0.0153322140,0.05000,10.670 | |