chieunq's picture
Upload folder using huggingface_hub
2c3fa00 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.0000001286,0.05000,0.569
0,self_attn.q_proj,0.0000002646,0.05000,0.475
0,self_attn.v_proj,0.0000001136,0.05000,9.847
0,self_attn.o_proj,0.0000003787,0.05000,0.208
0,mlp.gate_proj,0.0000030995,0.05000,0.433
0,mlp.up_proj,0.0000020126,0.05000,9.667
0,mlp.down_proj,0.0000005277,0.05000,0.688
1,self_attn.k_proj,0.0000000902,0.05000,0.378
1,self_attn.q_proj,0.0000001889,0.05000,0.430
1,self_attn.v_proj,0.0000000910,0.05000,9.661
1,self_attn.o_proj,0.0000001557,0.05000,0.216
1,mlp.gate_proj,0.0000554367,0.05000,0.393
1,mlp.up_proj,0.0000223800,0.05000,9.681
1,mlp.down_proj,0.0000009195,0.05000,0.664
2,self_attn.k_proj,0.0000001894,0.05000,0.415
2,self_attn.q_proj,0.0000004174,0.05000,0.487
2,self_attn.v_proj,0.0000001915,0.05000,8.161
2,self_attn.o_proj,0.0000002722,0.05000,0.207
2,mlp.gate_proj,0.0000472408,0.05000,0.393
2,mlp.up_proj,0.0000191339,0.05000,9.683
2,mlp.down_proj,0.0099027801,0.05000,0.647
3,self_attn.k_proj,0.0000014196,0.05000,0.393
3,self_attn.q_proj,0.0000028513,0.05000,0.445
3,self_attn.v_proj,0.0000014696,0.05000,9.661
3,self_attn.o_proj,0.0000005255,0.05000,0.212
3,mlp.gate_proj,0.0000556838,0.05000,0.403
3,mlp.up_proj,0.0000240990,0.05000,8.305
3,mlp.down_proj,0.0000016354,0.05000,0.651
4,self_attn.k_proj,0.0000013536,0.05000,0.406
4,self_attn.q_proj,0.0000028432,0.05000,0.422
4,self_attn.v_proj,0.0000015019,0.05000,9.641
4,self_attn.o_proj,0.0000009051,0.05000,0.217
4,mlp.gate_proj,0.0000505280,0.05000,0.420
4,mlp.up_proj,0.0000238862,0.05000,9.680
4,mlp.down_proj,0.0000022756,0.05000,0.656
5,self_attn.k_proj,0.0000018439,0.05000,0.416
5,self_attn.q_proj,0.0000041231,0.05000,0.428
5,self_attn.v_proj,0.0000020115,0.05000,9.656
5,self_attn.o_proj,0.0000011567,0.05000,0.217
5,mlp.gate_proj,0.0000228395,0.05000,0.449
5,mlp.up_proj,0.0000156479,0.05000,9.683
5,mlp.down_proj,0.0000032556,0.05000,0.653
6,self_attn.k_proj,0.0000016667,0.05000,0.392
6,self_attn.q_proj,0.0000034560,0.05000,0.464
6,self_attn.v_proj,0.0000016042,0.05000,8.174
6,self_attn.o_proj,0.0000013321,0.05000,0.208
6,mlp.gate_proj,0.0000317576,0.05000,0.424
6,mlp.up_proj,0.0000222448,0.05000,9.677
6,mlp.down_proj,0.0000047190,0.05000,0.651
7,self_attn.k_proj,0.0000034871,0.05000,0.409
7,self_attn.q_proj,0.0000079519,0.05000,0.418
7,self_attn.v_proj,0.0000039857,0.05000,9.642
7,self_attn.o_proj,0.0000019424,0.05000,0.212
7,mlp.gate_proj,0.0000451046,0.05000,0.392
7,mlp.up_proj,0.0000298035,0.05000,8.257
7,mlp.down_proj,0.0000054742,0.05000,0.653
8,self_attn.k_proj,0.0000048507,0.05000,0.388
8,self_attn.q_proj,0.0000100572,0.05000,0.422
8,self_attn.v_proj,0.0000045682,0.05000,9.650
8,self_attn.o_proj,0.0000016871,0.05000,0.212
8,mlp.gate_proj,0.0000407348,0.05000,0.412
8,mlp.up_proj,0.0000301114,0.05000,9.659
8,mlp.down_proj,0.0000070363,0.05000,0.652
9,self_attn.k_proj,0.0000098412,0.05000,0.387
9,self_attn.q_proj,0.0000214254,0.05000,0.426
9,self_attn.v_proj,0.0000094100,0.05000,9.654
9,self_attn.o_proj,0.0000050124,0.05000,0.213
9,mlp.gate_proj,0.0000392365,0.05000,0.422
9,mlp.up_proj,0.0000317824,0.05000,9.680
9,mlp.down_proj,0.0000100710,0.05000,0.650
10,self_attn.k_proj,0.0000077404,0.05000,0.381
10,self_attn.q_proj,0.0000169567,0.05000,0.419
10,self_attn.v_proj,0.0000080448,0.05000,8.179
10,self_attn.o_proj,0.0000045071,0.05000,0.207
10,mlp.gate_proj,0.0000393384,0.05000,0.434
10,mlp.up_proj,0.0000329698,0.05000,9.667
10,mlp.down_proj,0.0000156726,0.05000,0.665
11,self_attn.k_proj,0.0000159419,0.05000,0.388
11,self_attn.q_proj,0.0000354457,0.05000,0.413
11,self_attn.v_proj,0.0000139918,0.05000,9.658
11,self_attn.o_proj,0.0000126698,0.05000,0.210
11,mlp.gate_proj,0.0000352747,0.05000,0.440
11,mlp.up_proj,0.0000340574,0.05000,8.291
11,mlp.down_proj,0.0000195205,0.05000,0.649
12,self_attn.k_proj,0.0000159710,0.05000,0.384
12,self_attn.q_proj,0.0000356597,0.05000,0.429
12,self_attn.v_proj,0.0000159614,0.05000,9.662
12,self_attn.o_proj,0.0000078580,0.05000,0.212
12,mlp.gate_proj,0.0000364643,0.05000,0.406
12,mlp.up_proj,0.0000370203,0.05000,9.680
12,mlp.down_proj,0.0000224948,0.05000,0.655
13,self_attn.k_proj,0.0000212178,0.05000,0.393
13,self_attn.q_proj,0.0000546827,0.05000,0.444
13,self_attn.v_proj,0.0000230411,0.05000,9.652
13,self_attn.o_proj,0.0000118011,0.05000,0.213
13,mlp.gate_proj,0.0000409560,0.05000,0.412
13,mlp.up_proj,0.0000416904,0.05000,9.670
13,mlp.down_proj,0.0000318613,0.05000,0.654
14,self_attn.k_proj,0.0000363028,0.05000,0.446
14,self_attn.q_proj,0.0000869382,0.05000,0.423
14,self_attn.v_proj,0.0000376178,0.05000,8.239
14,self_attn.o_proj,0.0000167371,0.05000,0.206
14,mlp.gate_proj,0.0000454664,0.05000,0.443
14,mlp.up_proj,0.0000474814,0.05000,9.673
14,mlp.down_proj,0.0000445586,0.05000,0.650
15,self_attn.k_proj,0.0000688017,0.05000,0.447
15,self_attn.q_proj,0.0001997899,0.05000,0.497
15,self_attn.v_proj,0.0000827729,0.05000,9.652
15,self_attn.o_proj,0.0000320234,0.05000,0.214
15,mlp.gate_proj,0.0000528398,0.05000,0.455
15,mlp.up_proj,0.0000566378,0.05000,8.255
15,mlp.down_proj,0.0000653121,0.05000,0.649
16,self_attn.k_proj,0.0001001867,0.05000,0.429
16,self_attn.q_proj,0.0002616168,0.05000,0.451
16,self_attn.v_proj,0.0000959632,0.05000,9.640
16,self_attn.o_proj,0.0000444373,0.05000,0.211
16,mlp.gate_proj,0.0000633158,0.05000,0.443
16,mlp.up_proj,0.0000730107,0.05000,9.669
16,mlp.down_proj,0.0001600736,0.05000,0.649
17,self_attn.k_proj,0.0002788753,0.05000,0.421
17,self_attn.q_proj,0.0007597560,0.05000,0.434
17,self_attn.v_proj,0.0003315294,0.05000,9.658
17,self_attn.o_proj,0.0001125035,0.05000,0.214
17,mlp.gate_proj,0.0000975621,0.05000,0.409
17,mlp.up_proj,0.0001136578,0.05000,9.672
17,mlp.down_proj,0.0002273930,0.05000,0.653
18,self_attn.k_proj,0.0002986319,0.05000,0.443
18,self_attn.q_proj,0.0008368891,0.05000,0.437
18,self_attn.v_proj,0.0003074740,0.05000,8.188
18,self_attn.o_proj,0.0000965470,0.05000,0.207
18,mlp.gate_proj,0.0001294523,0.05000,0.396
18,mlp.up_proj,0.0001504320,0.05000,9.665
18,mlp.down_proj,0.0004062122,0.05000,0.657
19,self_attn.k_proj,0.0005055367,0.05000,0.408
19,self_attn.q_proj,0.0014725006,0.05000,0.417
19,self_attn.v_proj,0.0005765656,0.05000,9.634
19,self_attn.o_proj,0.0002112224,0.05000,0.212
19,mlp.gate_proj,0.0001672620,0.05000,0.420
19,mlp.up_proj,0.0002034081,0.05000,7.917
19,mlp.down_proj,0.0007933816,0.05000,0.659
20,self_attn.k_proj,0.0008494559,0.05000,0.398
20,self_attn.q_proj,0.0023191713,0.05000,0.433
20,self_attn.v_proj,0.0009429085,0.05000,9.647
20,self_attn.o_proj,0.0003886604,0.05000,0.210
20,mlp.gate_proj,0.0002268225,0.05000,0.415
20,mlp.up_proj,0.0002673458,0.05000,9.676
20,mlp.down_proj,0.0010970989,0.05000,0.652
21,self_attn.k_proj,0.0013209661,0.05000,0.463
21,self_attn.q_proj,0.0033686485,0.05000,0.538
21,self_attn.v_proj,0.0015625238,0.05000,9.667
21,self_attn.o_proj,0.0004073506,0.05000,0.210
21,mlp.gate_proj,0.0002858517,0.05000,0.411
21,mlp.up_proj,0.0003349930,0.05000,9.662
21,mlp.down_proj,0.0015875959,0.05000,0.652
22,self_attn.k_proj,0.0016932811,0.05000,0.385
22,self_attn.q_proj,0.0042630833,0.05000,0.434
22,self_attn.v_proj,0.0021211004,0.05000,8.181
22,self_attn.o_proj,0.0003815958,0.05000,0.206
22,mlp.gate_proj,0.0003353789,0.05000,0.412
22,mlp.up_proj,0.0003857626,0.05000,9.671
22,mlp.down_proj,0.0018017970,0.05000,0.656
23,self_attn.k_proj,0.0022752626,0.05000,0.427
23,self_attn.q_proj,0.0050662677,0.05000,0.440
23,self_attn.v_proj,0.0026124159,0.05000,9.650
23,self_attn.o_proj,0.0004899677,0.05000,0.210
23,mlp.gate_proj,0.0003991299,0.05000,0.425
23,mlp.up_proj,0.0004568473,0.05000,8.270
23,mlp.down_proj,0.0019531925,0.05000,0.656
24,self_attn.k_proj,0.0038218261,0.05000,0.400
24,self_attn.q_proj,0.0097421070,0.05000,0.438
24,self_attn.v_proj,0.0044700833,0.05000,9.649
24,self_attn.o_proj,0.0007072901,0.05000,0.211
24,mlp.gate_proj,0.0003753161,0.05000,0.459
24,mlp.up_proj,0.0004418180,0.05000,9.665
24,mlp.down_proj,0.0023237413,0.05000,0.652
25,self_attn.k_proj,0.0043164005,0.05000,0.412
25,self_attn.q_proj,0.0108171433,0.05000,0.428
25,self_attn.v_proj,0.0065032306,0.05000,9.648
25,self_attn.o_proj,0.0008021041,0.05000,0.213
25,mlp.gate_proj,0.0003432549,0.05000,0.411
25,mlp.up_proj,0.0004128897,0.05000,9.662
25,mlp.down_proj,0.0027670667,0.05000,0.654
26,self_attn.k_proj,0.0038977822,0.05000,0.405
26,self_attn.q_proj,0.0104804013,0.05000,0.444
26,self_attn.v_proj,0.0056383276,0.05000,8.228
26,self_attn.o_proj,0.0016605759,0.05000,0.209
26,mlp.gate_proj,0.0003358276,0.05000,0.414
26,mlp.up_proj,0.0003946834,0.05000,9.673
26,mlp.down_proj,0.0031093943,0.05000,0.653
27,self_attn.k_proj,0.0020447240,0.05000,0.412
27,self_attn.q_proj,0.0043709083,0.05000,0.437
27,self_attn.v_proj,0.0024168304,0.05000,9.666
27,self_attn.o_proj,0.0008180637,0.05000,0.213
27,mlp.gate_proj,0.0007121118,0.05000,0.417
27,mlp.up_proj,0.0006765889,0.05000,8.258
27,mlp.down_proj,0.0101041929,0.05000,0.654