| layer,module,loss,samples,damp,time | |
| 0,self_attn.k_proj,0.0000001286,0.05000,0.569 | |
| 0,self_attn.q_proj,0.0000002646,0.05000,0.475 | |
| 0,self_attn.v_proj,0.0000001136,0.05000,9.847 | |
| 0,self_attn.o_proj,0.0000003787,0.05000,0.208 | |
| 0,mlp.gate_proj,0.0000030995,0.05000,0.433 | |
| 0,mlp.up_proj,0.0000020126,0.05000,9.667 | |
| 0,mlp.down_proj,0.0000005277,0.05000,0.688 | |
| 1,self_attn.k_proj,0.0000000902,0.05000,0.378 | |
| 1,self_attn.q_proj,0.0000001889,0.05000,0.430 | |
| 1,self_attn.v_proj,0.0000000910,0.05000,9.661 | |
| 1,self_attn.o_proj,0.0000001557,0.05000,0.216 | |
| 1,mlp.gate_proj,0.0000554367,0.05000,0.393 | |
| 1,mlp.up_proj,0.0000223800,0.05000,9.681 | |
| 1,mlp.down_proj,0.0000009195,0.05000,0.664 | |
| 2,self_attn.k_proj,0.0000001894,0.05000,0.415 | |
| 2,self_attn.q_proj,0.0000004174,0.05000,0.487 | |
| 2,self_attn.v_proj,0.0000001915,0.05000,8.161 | |
| 2,self_attn.o_proj,0.0000002722,0.05000,0.207 | |
| 2,mlp.gate_proj,0.0000472408,0.05000,0.393 | |
| 2,mlp.up_proj,0.0000191339,0.05000,9.683 | |
| 2,mlp.down_proj,0.0099027801,0.05000,0.647 | |
| 3,self_attn.k_proj,0.0000014196,0.05000,0.393 | |
| 3,self_attn.q_proj,0.0000028513,0.05000,0.445 | |
| 3,self_attn.v_proj,0.0000014696,0.05000,9.661 | |
| 3,self_attn.o_proj,0.0000005255,0.05000,0.212 | |
| 3,mlp.gate_proj,0.0000556838,0.05000,0.403 | |
| 3,mlp.up_proj,0.0000240990,0.05000,8.305 | |
| 3,mlp.down_proj,0.0000016354,0.05000,0.651 | |
| 4,self_attn.k_proj,0.0000013536,0.05000,0.406 | |
| 4,self_attn.q_proj,0.0000028432,0.05000,0.422 | |
| 4,self_attn.v_proj,0.0000015019,0.05000,9.641 | |
| 4,self_attn.o_proj,0.0000009051,0.05000,0.217 | |
| 4,mlp.gate_proj,0.0000505280,0.05000,0.420 | |
| 4,mlp.up_proj,0.0000238862,0.05000,9.680 | |
| 4,mlp.down_proj,0.0000022756,0.05000,0.656 | |
| 5,self_attn.k_proj,0.0000018439,0.05000,0.416 | |
| 5,self_attn.q_proj,0.0000041231,0.05000,0.428 | |
| 5,self_attn.v_proj,0.0000020115,0.05000,9.656 | |
| 5,self_attn.o_proj,0.0000011567,0.05000,0.217 | |
| 5,mlp.gate_proj,0.0000228395,0.05000,0.449 | |
| 5,mlp.up_proj,0.0000156479,0.05000,9.683 | |
| 5,mlp.down_proj,0.0000032556,0.05000,0.653 | |
| 6,self_attn.k_proj,0.0000016667,0.05000,0.392 | |
| 6,self_attn.q_proj,0.0000034560,0.05000,0.464 | |
| 6,self_attn.v_proj,0.0000016042,0.05000,8.174 | |
| 6,self_attn.o_proj,0.0000013321,0.05000,0.208 | |
| 6,mlp.gate_proj,0.0000317576,0.05000,0.424 | |
| 6,mlp.up_proj,0.0000222448,0.05000,9.677 | |
| 6,mlp.down_proj,0.0000047190,0.05000,0.651 | |
| 7,self_attn.k_proj,0.0000034871,0.05000,0.409 | |
| 7,self_attn.q_proj,0.0000079519,0.05000,0.418 | |
| 7,self_attn.v_proj,0.0000039857,0.05000,9.642 | |
| 7,self_attn.o_proj,0.0000019424,0.05000,0.212 | |
| 7,mlp.gate_proj,0.0000451046,0.05000,0.392 | |
| 7,mlp.up_proj,0.0000298035,0.05000,8.257 | |
| 7,mlp.down_proj,0.0000054742,0.05000,0.653 | |
| 8,self_attn.k_proj,0.0000048507,0.05000,0.388 | |
| 8,self_attn.q_proj,0.0000100572,0.05000,0.422 | |
| 8,self_attn.v_proj,0.0000045682,0.05000,9.650 | |
| 8,self_attn.o_proj,0.0000016871,0.05000,0.212 | |
| 8,mlp.gate_proj,0.0000407348,0.05000,0.412 | |
| 8,mlp.up_proj,0.0000301114,0.05000,9.659 | |
| 8,mlp.down_proj,0.0000070363,0.05000,0.652 | |
| 9,self_attn.k_proj,0.0000098412,0.05000,0.387 | |
| 9,self_attn.q_proj,0.0000214254,0.05000,0.426 | |
| 9,self_attn.v_proj,0.0000094100,0.05000,9.654 | |
| 9,self_attn.o_proj,0.0000050124,0.05000,0.213 | |
| 9,mlp.gate_proj,0.0000392365,0.05000,0.422 | |
| 9,mlp.up_proj,0.0000317824,0.05000,9.680 | |
| 9,mlp.down_proj,0.0000100710,0.05000,0.650 | |
| 10,self_attn.k_proj,0.0000077404,0.05000,0.381 | |
| 10,self_attn.q_proj,0.0000169567,0.05000,0.419 | |
| 10,self_attn.v_proj,0.0000080448,0.05000,8.179 | |
| 10,self_attn.o_proj,0.0000045071,0.05000,0.207 | |
| 10,mlp.gate_proj,0.0000393384,0.05000,0.434 | |
| 10,mlp.up_proj,0.0000329698,0.05000,9.667 | |
| 10,mlp.down_proj,0.0000156726,0.05000,0.665 | |
| 11,self_attn.k_proj,0.0000159419,0.05000,0.388 | |
| 11,self_attn.q_proj,0.0000354457,0.05000,0.413 | |
| 11,self_attn.v_proj,0.0000139918,0.05000,9.658 | |
| 11,self_attn.o_proj,0.0000126698,0.05000,0.210 | |
| 11,mlp.gate_proj,0.0000352747,0.05000,0.440 | |
| 11,mlp.up_proj,0.0000340574,0.05000,8.291 | |
| 11,mlp.down_proj,0.0000195205,0.05000,0.649 | |
| 12,self_attn.k_proj,0.0000159710,0.05000,0.384 | |
| 12,self_attn.q_proj,0.0000356597,0.05000,0.429 | |
| 12,self_attn.v_proj,0.0000159614,0.05000,9.662 | |
| 12,self_attn.o_proj,0.0000078580,0.05000,0.212 | |
| 12,mlp.gate_proj,0.0000364643,0.05000,0.406 | |
| 12,mlp.up_proj,0.0000370203,0.05000,9.680 | |
| 12,mlp.down_proj,0.0000224948,0.05000,0.655 | |
| 13,self_attn.k_proj,0.0000212178,0.05000,0.393 | |
| 13,self_attn.q_proj,0.0000546827,0.05000,0.444 | |
| 13,self_attn.v_proj,0.0000230411,0.05000,9.652 | |
| 13,self_attn.o_proj,0.0000118011,0.05000,0.213 | |
| 13,mlp.gate_proj,0.0000409560,0.05000,0.412 | |
| 13,mlp.up_proj,0.0000416904,0.05000,9.670 | |
| 13,mlp.down_proj,0.0000318613,0.05000,0.654 | |
| 14,self_attn.k_proj,0.0000363028,0.05000,0.446 | |
| 14,self_attn.q_proj,0.0000869382,0.05000,0.423 | |
| 14,self_attn.v_proj,0.0000376178,0.05000,8.239 | |
| 14,self_attn.o_proj,0.0000167371,0.05000,0.206 | |
| 14,mlp.gate_proj,0.0000454664,0.05000,0.443 | |
| 14,mlp.up_proj,0.0000474814,0.05000,9.673 | |
| 14,mlp.down_proj,0.0000445586,0.05000,0.650 | |
| 15,self_attn.k_proj,0.0000688017,0.05000,0.447 | |
| 15,self_attn.q_proj,0.0001997899,0.05000,0.497 | |
| 15,self_attn.v_proj,0.0000827729,0.05000,9.652 | |
| 15,self_attn.o_proj,0.0000320234,0.05000,0.214 | |
| 15,mlp.gate_proj,0.0000528398,0.05000,0.455 | |
| 15,mlp.up_proj,0.0000566378,0.05000,8.255 | |
| 15,mlp.down_proj,0.0000653121,0.05000,0.649 | |
| 16,self_attn.k_proj,0.0001001867,0.05000,0.429 | |
| 16,self_attn.q_proj,0.0002616168,0.05000,0.451 | |
| 16,self_attn.v_proj,0.0000959632,0.05000,9.640 | |
| 16,self_attn.o_proj,0.0000444373,0.05000,0.211 | |
| 16,mlp.gate_proj,0.0000633158,0.05000,0.443 | |
| 16,mlp.up_proj,0.0000730107,0.05000,9.669 | |
| 16,mlp.down_proj,0.0001600736,0.05000,0.649 | |
| 17,self_attn.k_proj,0.0002788753,0.05000,0.421 | |
| 17,self_attn.q_proj,0.0007597560,0.05000,0.434 | |
| 17,self_attn.v_proj,0.0003315294,0.05000,9.658 | |
| 17,self_attn.o_proj,0.0001125035,0.05000,0.214 | |
| 17,mlp.gate_proj,0.0000975621,0.05000,0.409 | |
| 17,mlp.up_proj,0.0001136578,0.05000,9.672 | |
| 17,mlp.down_proj,0.0002273930,0.05000,0.653 | |
| 18,self_attn.k_proj,0.0002986319,0.05000,0.443 | |
| 18,self_attn.q_proj,0.0008368891,0.05000,0.437 | |
| 18,self_attn.v_proj,0.0003074740,0.05000,8.188 | |
| 18,self_attn.o_proj,0.0000965470,0.05000,0.207 | |
| 18,mlp.gate_proj,0.0001294523,0.05000,0.396 | |
| 18,mlp.up_proj,0.0001504320,0.05000,9.665 | |
| 18,mlp.down_proj,0.0004062122,0.05000,0.657 | |
| 19,self_attn.k_proj,0.0005055367,0.05000,0.408 | |
| 19,self_attn.q_proj,0.0014725006,0.05000,0.417 | |
| 19,self_attn.v_proj,0.0005765656,0.05000,9.634 | |
| 19,self_attn.o_proj,0.0002112224,0.05000,0.212 | |
| 19,mlp.gate_proj,0.0001672620,0.05000,0.420 | |
| 19,mlp.up_proj,0.0002034081,0.05000,7.917 | |
| 19,mlp.down_proj,0.0007933816,0.05000,0.659 | |
| 20,self_attn.k_proj,0.0008494559,0.05000,0.398 | |
| 20,self_attn.q_proj,0.0023191713,0.05000,0.433 | |
| 20,self_attn.v_proj,0.0009429085,0.05000,9.647 | |
| 20,self_attn.o_proj,0.0003886604,0.05000,0.210 | |
| 20,mlp.gate_proj,0.0002268225,0.05000,0.415 | |
| 20,mlp.up_proj,0.0002673458,0.05000,9.676 | |
| 20,mlp.down_proj,0.0010970989,0.05000,0.652 | |
| 21,self_attn.k_proj,0.0013209661,0.05000,0.463 | |
| 21,self_attn.q_proj,0.0033686485,0.05000,0.538 | |
| 21,self_attn.v_proj,0.0015625238,0.05000,9.667 | |
| 21,self_attn.o_proj,0.0004073506,0.05000,0.210 | |
| 21,mlp.gate_proj,0.0002858517,0.05000,0.411 | |
| 21,mlp.up_proj,0.0003349930,0.05000,9.662 | |
| 21,mlp.down_proj,0.0015875959,0.05000,0.652 | |
| 22,self_attn.k_proj,0.0016932811,0.05000,0.385 | |
| 22,self_attn.q_proj,0.0042630833,0.05000,0.434 | |
| 22,self_attn.v_proj,0.0021211004,0.05000,8.181 | |
| 22,self_attn.o_proj,0.0003815958,0.05000,0.206 | |
| 22,mlp.gate_proj,0.0003353789,0.05000,0.412 | |
| 22,mlp.up_proj,0.0003857626,0.05000,9.671 | |
| 22,mlp.down_proj,0.0018017970,0.05000,0.656 | |
| 23,self_attn.k_proj,0.0022752626,0.05000,0.427 | |
| 23,self_attn.q_proj,0.0050662677,0.05000,0.440 | |
| 23,self_attn.v_proj,0.0026124159,0.05000,9.650 | |
| 23,self_attn.o_proj,0.0004899677,0.05000,0.210 | |
| 23,mlp.gate_proj,0.0003991299,0.05000,0.425 | |
| 23,mlp.up_proj,0.0004568473,0.05000,8.270 | |
| 23,mlp.down_proj,0.0019531925,0.05000,0.656 | |
| 24,self_attn.k_proj,0.0038218261,0.05000,0.400 | |
| 24,self_attn.q_proj,0.0097421070,0.05000,0.438 | |
| 24,self_attn.v_proj,0.0044700833,0.05000,9.649 | |
| 24,self_attn.o_proj,0.0007072901,0.05000,0.211 | |
| 24,mlp.gate_proj,0.0003753161,0.05000,0.459 | |
| 24,mlp.up_proj,0.0004418180,0.05000,9.665 | |
| 24,mlp.down_proj,0.0023237413,0.05000,0.652 | |
| 25,self_attn.k_proj,0.0043164005,0.05000,0.412 | |
| 25,self_attn.q_proj,0.0108171433,0.05000,0.428 | |
| 25,self_attn.v_proj,0.0065032306,0.05000,9.648 | |
| 25,self_attn.o_proj,0.0008021041,0.05000,0.213 | |
| 25,mlp.gate_proj,0.0003432549,0.05000,0.411 | |
| 25,mlp.up_proj,0.0004128897,0.05000,9.662 | |
| 25,mlp.down_proj,0.0027670667,0.05000,0.654 | |
| 26,self_attn.k_proj,0.0038977822,0.05000,0.405 | |
| 26,self_attn.q_proj,0.0104804013,0.05000,0.444 | |
| 26,self_attn.v_proj,0.0056383276,0.05000,8.228 | |
| 26,self_attn.o_proj,0.0016605759,0.05000,0.209 | |
| 26,mlp.gate_proj,0.0003358276,0.05000,0.414 | |
| 26,mlp.up_proj,0.0003946834,0.05000,9.673 | |
| 26,mlp.down_proj,0.0031093943,0.05000,0.653 | |
| 27,self_attn.k_proj,0.0020447240,0.05000,0.412 | |
| 27,self_attn.q_proj,0.0043709083,0.05000,0.437 | |
| 27,self_attn.v_proj,0.0024168304,0.05000,9.666 | |
| 27,self_attn.o_proj,0.0008180637,0.05000,0.213 | |
| 27,mlp.gate_proj,0.0007121118,0.05000,0.417 | |
| 27,mlp.up_proj,0.0006765889,0.05000,8.258 | |
| 27,mlp.down_proj,0.0101041929,0.05000,0.654 | |