| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000432854,0.05000,1.766 | |
| 0,self_attn.v_proj,0.0000049972,0.05000,1.793 | |
| 0,self_attn.q_proj,0.0001757931,0.05000,1.798 | |
| 0,self_attn.o_proj,0.0000108898,0.05000,0.778 | |
| 0,mlp.up_proj,0.0003301854,0.05000,1.146 | |
| 0,mlp.gate_proj,0.0007666261,0.05000,1.183 | |
| 0,mlp.down_proj,0.0000141513,0.05000,5.336 | |
| 1,self_attn.k_proj,0.0000358306,0.05000,1.767 | |
| 1,self_attn.q_proj,0.0001356997,0.05000,1.789 | |
| 1,self_attn.v_proj,0.0000092715,0.05000,1.792 | |
| 1,self_attn.o_proj,0.0000043125,0.05000,0.785 | |
| 1,mlp.up_proj,0.0068297327,0.05000,1.161 | |
| 1,mlp.gate_proj,0.0110956548,0.05000,1.184 | |
| 1,mlp.down_proj,0.0000095164,0.05000,5.333 | |
| 2,self_attn.k_proj,0.0000858678,0.05000,1.750 | |
| 2,self_attn.v_proj,0.0000151014,0.05000,1.786 | |
| 2,self_attn.q_proj,0.0003180285,0.05000,1.790 | |
| 2,self_attn.o_proj,0.0000078531,0.05000,0.777 | |
| 2,mlp.up_proj,0.0060570274,0.05000,1.143 | |
| 2,mlp.gate_proj,0.0098869666,0.05000,1.177 | |
| 2,mlp.down_proj,0.0000373999,0.05000,5.348 | |
| 3,self_attn.k_proj,0.0000810958,0.05000,1.771 | |
| 3,self_attn.q_proj,0.0003177889,0.05000,1.790 | |
| 3,self_attn.v_proj,0.0000203367,0.05000,1.792 | |
| 3,self_attn.o_proj,0.0000193827,0.05000,0.780 | |
| 3,mlp.up_proj,0.0127348766,0.05000,1.154 | |
| 3,mlp.gate_proj,0.0171400174,0.05000,1.185 | |
| 3,mlp.down_proj,0.0021732034,0.05000,5.357 | |
| 4,self_attn.k_proj,0.0001399196,0.05000,1.776 | |
| 4,self_attn.q_proj,0.0006156289,0.05000,1.794 | |
| 4,self_attn.v_proj,0.0000480736,0.05000,1.796 | |
| 4,self_attn.o_proj,0.0000394140,0.05000,0.788 | |
| 4,mlp.up_proj,0.0090971480,0.05000,1.153 | |
| 4,mlp.gate_proj,0.0135318746,0.05000,1.185 | |
| 4,mlp.down_proj,0.0023862841,0.05000,5.319 | |
| 5,self_attn.k_proj,0.0001325996,0.05000,1.784 | |
| 5,self_attn.q_proj,0.0006572159,0.05000,1.797 | |
| 5,self_attn.v_proj,0.0000548861,0.05000,1.799 | |
| 5,self_attn.o_proj,0.0000599871,0.05000,0.795 | |
| 5,mlp.up_proj,0.0147371594,0.05000,1.171 | |
| 5,mlp.gate_proj,0.0186996124,0.05000,1.195 | |
| 5,mlp.down_proj,0.0002437168,0.05000,5.403 | |
| 6,self_attn.k_proj,0.0000885772,0.05000,1.742 | |
| 6,self_attn.v_proj,0.0000421790,0.05000,1.777 | |
| 6,self_attn.q_proj,0.0004314109,0.05000,1.783 | |
| 6,self_attn.o_proj,0.0000446818,0.05000,0.794 | |
| 6,mlp.up_proj,0.0026338197,0.05000,1.157 | |
| 6,mlp.gate_proj,0.0037542884,0.05000,1.188 | |
| 6,mlp.down_proj,0.0000997583,0.05000,5.390 | |
| 7,self_attn.k_proj,0.0000925571,0.05000,1.789 | |
| 7,self_attn.q_proj,0.0005228582,0.05000,1.802 | |
| 7,self_attn.v_proj,0.0000846739,0.05000,1.804 | |
| 7,self_attn.o_proj,0.0000540034,0.05000,0.791 | |
| 7,mlp.up_proj,0.0021272203,0.05000,1.164 | |
| 7,mlp.gate_proj,0.0023616219,0.05000,1.187 | |
| 7,mlp.down_proj,0.0001141313,0.05000,5.314 | |
| 8,self_attn.k_proj,0.0001738771,0.05000,1.777 | |
| 8,self_attn.v_proj,0.0000707547,0.05000,1.794 | |
| 8,self_attn.q_proj,0.0007570342,0.05000,1.799 | |
| 8,self_attn.o_proj,0.0000702879,0.05000,0.788 | |
| 8,mlp.up_proj,0.0023392382,0.05000,1.160 | |
| 8,mlp.gate_proj,0.0024381351,0.05000,1.184 | |
| 8,mlp.down_proj,0.0001141036,0.05000,5.359 | |
| 9,self_attn.k_proj,0.0001255440,0.05000,1.747 | |
| 9,self_attn.v_proj,0.0001075853,0.05000,1.781 | |
| 9,self_attn.q_proj,0.0006896859,0.05000,1.785 | |
| 9,self_attn.o_proj,0.0000752609,0.05000,0.778 | |
| 9,mlp.up_proj,0.0046194003,0.05000,1.152 | |
| 9,mlp.gate_proj,0.0072552940,0.05000,1.185 | |
| 9,mlp.down_proj,0.0001435438,0.05000,5.375 | |
| 10,self_attn.v_proj,0.0000711022,0.05000,1.815 | |
| 10,self_attn.k_proj,0.0001285309,0.05000,1.819 | |
| 10,self_attn.q_proj,0.0006438414,0.05000,1.842 | |
| 10,self_attn.o_proj,0.0000531726,0.05000,0.780 | |
| 10,mlp.up_proj,0.0023653700,0.05000,1.150 | |
| 10,mlp.gate_proj,0.0026815632,0.05000,1.183 | |
| 10,mlp.down_proj,0.0000887731,0.05000,5.373 | |
| 11,self_attn.k_proj,0.0001696957,0.05000,1.778 | |
| 11,self_attn.v_proj,0.0000648065,0.05000,1.797 | |
| 11,self_attn.q_proj,0.0007402942,0.05000,1.801 | |
| 11,self_attn.o_proj,0.0000742858,0.05000,0.783 | |
| 11,mlp.up_proj,0.0021493328,0.05000,1.163 | |
| 11,mlp.gate_proj,0.0022600763,0.05000,1.190 | |
| 11,mlp.down_proj,0.0002429208,0.05000,5.360 | |
| 12,self_attn.k_proj,0.0001913924,0.05000,1.775 | |
| 12,self_attn.v_proj,0.0000848261,0.05000,1.794 | |
| 12,self_attn.q_proj,0.0008414217,0.05000,1.799 | |
| 12,self_attn.o_proj,0.0000603520,0.05000,0.791 | |
| 12,mlp.up_proj,0.0021892047,0.05000,1.165 | |
| 12,mlp.gate_proj,0.0021619192,0.05000,1.188 | |
| 12,mlp.down_proj,0.0000992026,0.05000,5.388 | |
| 13,self_attn.k_proj,0.0001764100,0.05000,1.783 | |
| 13,self_attn.v_proj,0.0001123422,0.05000,1.800 | |
| 13,self_attn.q_proj,0.0009153854,0.05000,1.803 | |
| 13,self_attn.o_proj,0.0000794259,0.05000,0.789 | |
| 13,mlp.up_proj,0.0022109749,0.05000,1.161 | |
| 13,mlp.gate_proj,0.0023554429,0.05000,1.187 | |
| 13,mlp.down_proj,0.0000893284,0.05000,5.370 | |
| 14,self_attn.k_proj,0.0002561925,0.05000,1.782 | |
| 14,self_attn.v_proj,0.0001154645,0.05000,1.787 | |
| 14,self_attn.q_proj,0.0013007666,0.05000,1.813 | |
| 14,self_attn.o_proj,0.0001204233,0.05000,0.781 | |
| 14,mlp.up_proj,0.0025638388,0.05000,1.145 | |
| 14,mlp.gate_proj,0.0025896619,0.05000,1.171 | |
| 14,mlp.down_proj,0.0000961390,0.05000,5.339 | |
| 15,self_attn.k_proj,0.0002411058,0.05000,1.771 | |
| 15,self_attn.v_proj,0.0001010086,0.05000,1.779 | |
| 15,self_attn.q_proj,0.0010763963,0.05000,1.806 | |
| 15,self_attn.o_proj,0.0001248457,0.05000,0.779 | |
| 15,mlp.up_proj,0.0025943129,0.05000,1.146 | |
| 15,mlp.gate_proj,0.0025343251,0.05000,1.173 | |
| 15,mlp.down_proj,0.0001141996,0.05000,5.327 | |
| 16,self_attn.k_proj,0.0002437389,0.05000,1.762 | |
| 16,self_attn.v_proj,0.0001444091,0.05000,1.778 | |
| 16,self_attn.q_proj,0.0012326450,0.05000,1.798 | |
| 16,self_attn.o_proj,0.0001986508,0.05000,0.780 | |
| 16,mlp.up_proj,0.0028457921,0.05000,1.147 | |
| 16,mlp.gate_proj,0.0027699758,0.05000,1.172 | |
| 16,mlp.down_proj,0.0001097131,0.05000,5.343 | |
| 17,self_attn.k_proj,0.0002372200,0.05000,1.779 | |
| 17,self_attn.v_proj,0.0001644637,0.05000,1.785 | |
| 17,self_attn.q_proj,0.0013344949,0.05000,1.804 | |
| 17,self_attn.o_proj,0.0001687157,0.05000,0.777 | |
| 17,mlp.up_proj,0.0034605139,0.05000,1.152 | |
| 17,mlp.gate_proj,0.0032823749,0.05000,1.177 | |
| 17,mlp.down_proj,0.0001509321,0.05000,5.323 | |
| 18,self_attn.k_proj,0.0001887011,0.05000,1.765 | |
| 18,self_attn.v_proj,0.0001808350,0.05000,1.779 | |
| 18,self_attn.q_proj,0.0010705749,0.05000,1.801 | |
| 18,self_attn.o_proj,0.0001657871,0.05000,0.783 | |
| 18,mlp.up_proj,0.0040642183,0.05000,1.148 | |
| 18,mlp.gate_proj,0.0037679110,0.05000,1.174 | |
| 18,mlp.down_proj,0.0002181015,0.05000,5.336 | |
| 19,self_attn.k_proj,0.0002055513,0.05000,1.769 | |
| 19,self_attn.v_proj,0.0002454614,0.05000,1.785 | |
| 19,self_attn.q_proj,0.0013781268,0.05000,1.805 | |
| 19,self_attn.o_proj,0.0002243668,0.05000,0.781 | |
| 19,mlp.up_proj,0.0046072615,0.05000,1.154 | |
| 19,mlp.gate_proj,0.0044774732,0.05000,1.177 | |
| 19,mlp.down_proj,0.0002187767,0.05000,5.333 | |
| 20,self_attn.k_proj,0.0002085851,0.05000,1.772 | |
| 20,self_attn.v_proj,0.0002610162,0.05000,1.786 | |
| 20,self_attn.q_proj,0.0013019970,0.05000,1.806 | |
| 20,self_attn.o_proj,0.0001514216,0.05000,0.781 | |
| 20,mlp.up_proj,0.0054252240,0.05000,1.148 | |
| 20,mlp.gate_proj,0.0051634870,0.05000,1.173 | |
| 20,mlp.down_proj,0.0003712054,0.05000,5.326 | |
| 21,self_attn.k_proj,0.0002118031,0.05000,1.759 | |
| 21,self_attn.v_proj,0.0003764736,0.05000,1.772 | |
| 21,self_attn.q_proj,0.0015059532,0.05000,1.788 | |
| 21,self_attn.o_proj,0.0004255283,0.05000,0.782 | |
| 21,mlp.up_proj,0.0066461328,0.05000,1.147 | |
| 21,mlp.gate_proj,0.0066254139,0.05000,1.174 | |
| 21,mlp.down_proj,0.0005992475,0.05000,5.317 | |
| 22,self_attn.k_proj,0.0002988659,0.05000,1.769 | |
| 22,self_attn.v_proj,0.0005736383,0.05000,1.783 | |
| 22,self_attn.q_proj,0.0021297575,0.05000,1.807 | |
| 22,self_attn.o_proj,0.0004206545,0.05000,0.780 | |
| 22,mlp.up_proj,0.0094454406,0.05000,1.151 | |
| 22,mlp.gate_proj,0.0092535556,0.05000,1.175 | |
| 22,mlp.down_proj,0.0008095826,0.05000,5.324 | |
| 23,self_attn.k_proj,0.0003835323,0.05000,1.771 | |
| 23,self_attn.v_proj,0.0007766295,0.05000,1.785 | |
| 23,self_attn.q_proj,0.0024568439,0.05000,1.806 | |
| 23,self_attn.o_proj,0.0008100346,0.05000,0.780 | |
| 23,mlp.up_proj,0.0125601661,0.05000,1.148 | |
| 23,mlp.gate_proj,0.0126166713,0.05000,1.174 | |
| 23,mlp.down_proj,0.0009607696,0.05000,5.323 | |
| 24,self_attn.k_proj,0.0003131202,0.05000,1.760 | |
| 24,self_attn.v_proj,0.0008387528,0.05000,1.777 | |
| 24,self_attn.q_proj,0.0022884397,0.05000,1.799 | |
| 24,self_attn.o_proj,0.0006900308,0.05000,0.784 | |
| 24,mlp.up_proj,0.0137791785,0.05000,1.152 | |
| 24,mlp.gate_proj,0.0128174114,0.05000,1.177 | |
| 24,mlp.down_proj,0.0013900608,0.05000,5.345 | |
| 25,self_attn.k_proj,0.0003696309,0.05000,1.796 | |
| 25,self_attn.v_proj,0.0014799064,0.05000,1.798 | |
| 25,self_attn.q_proj,0.0027035042,0.05000,1.818 | |
| 25,self_attn.o_proj,0.0010714627,0.05000,0.780 | |
| 25,mlp.up_proj,0.0188588492,0.05000,1.149 | |
| 25,mlp.gate_proj,0.0167194957,0.05000,1.181 | |
| 25,mlp.down_proj,0.0112290785,0.05000,5.347 | |
| 26,self_attn.k_proj,0.0005632932,0.05000,1.775 | |
| 26,self_attn.v_proj,0.0039053194,0.05000,1.784 | |
| 26,self_attn.q_proj,0.0044603734,0.05000,1.806 | |
| 26,self_attn.o_proj,0.0024405535,0.05000,0.786 | |
| 26,mlp.up_proj,0.0201260808,0.05000,1.157 | |
| 26,mlp.gate_proj,0.0176544122,0.05000,1.180 | |
| 26,mlp.down_proj,0.0254254744,0.05000,5.332 | |
| 27,self_attn.k_proj,0.0007584638,0.05000,1.767 | |
| 27,self_attn.v_proj,0.0063212753,0.05000,1.781 | |
| 27,self_attn.q_proj,0.0070051274,0.05000,1.795 | |
| 27,self_attn.o_proj,0.0045859847,0.05000,0.785 | |
| 27,mlp.up_proj,0.0242716040,0.05000,1.155 | |
| 27,mlp.gate_proj,0.0231725800,0.05000,1.181 | |
| 27,mlp.down_proj,0.0212887442,0.05000,5.341 | |