|
layer,module,loss,damp,time
|
|
0,self_attn.k_proj,198.69464,0.01000,1.094
|
|
0,self_attn.v_proj,195.76051,0.01000,0.776
|
|
0,self_attn.q_proj,243.30057,0.01000,0.792
|
|
0,self_attn.o_proj,36.38606,0.01000,0.626
|
|
0,mlp.up_proj,13.06959,0.01000,0.789
|
|
0,mlp.gate_proj,13.87642,0.01000,0.792
|
|
0,mlp.down_proj,0.57033,0.01000,3.270
|
|
1,self_attn.k_proj,11.76147,0.01000,0.767
|
|
1,self_attn.v_proj,11.56775,0.01000,0.765
|
|
1,self_attn.q_proj,3.06964,0.01000,0.768
|
|
1,self_attn.o_proj,1.91879,0.01000,0.607
|
|
1,mlp.up_proj,16.77610,0.01000,0.773
|
|
1,mlp.gate_proj,18.79979,0.01000,0.773
|
|
1,mlp.down_proj,0.10125,0.01000,3.253
|
|
2,self_attn.k_proj,13.69234,0.01000,0.760
|
|
2,self_attn.v_proj,13.41772,0.01000,0.757
|
|
2,self_attn.q_proj,6.14136,0.01000,0.770
|
|
2,self_attn.o_proj,2.78490,0.01000,0.609
|
|
2,mlp.up_proj,18.90626,0.01000,0.777
|
|
2,mlp.gate_proj,19.42534,0.01000,0.777
|
|
2,mlp.down_proj,0.20656,0.01000,3.240
|
|
3,self_attn.k_proj,12.26875,0.01000,0.771
|
|
3,self_attn.v_proj,11.49991,0.01000,0.767
|
|
3,self_attn.q_proj,3.87051,0.01000,0.768
|
|
3,self_attn.o_proj,6.08537,0.01000,0.611
|
|
3,mlp.up_proj,27.04681,0.01000,0.781
|
|
3,mlp.gate_proj,27.28091,0.01000,0.783
|
|
3,mlp.down_proj,0.71027,0.01000,3.261
|
|
4,self_attn.k_proj,13.06411,0.01000,0.761
|
|
4,self_attn.v_proj,10.97907,0.01000,0.767
|
|
4,self_attn.q_proj,8.22816,0.01000,0.767
|
|
4,self_attn.o_proj,2.14936,0.01000,0.615
|
|
4,mlp.up_proj,13.32326,0.01000,0.779
|
|
4,mlp.gate_proj,13.68868,0.01000,0.777
|
|
4,mlp.down_proj,0.13622,0.01000,3.269
|
|
5,self_attn.k_proj,10.77550,0.01000,0.769
|
|
5,self_attn.v_proj,5.25996,0.01000,0.766
|
|
5,self_attn.q_proj,1.15328,0.01000,0.770
|
|
5,self_attn.o_proj,0.36760,0.01000,0.620
|
|
5,mlp.up_proj,14.03705,0.01000,0.783
|
|
5,mlp.gate_proj,14.03240,0.01000,0.777
|
|
5,mlp.down_proj,0.09100,0.01000,3.232
|
|
6,self_attn.k_proj,7.06065,0.01000,0.757
|
|
6,self_attn.v_proj,5.88580,0.01000,0.757
|
|
6,self_attn.q_proj,2.05951,0.01000,0.763
|
|
6,self_attn.o_proj,0.54376,0.01000,0.607
|
|
6,mlp.up_proj,13.85581,0.01000,0.775
|
|
6,mlp.gate_proj,13.96360,0.01000,0.774
|
|
6,mlp.down_proj,0.20618,0.01000,3.237
|
|
7,self_attn.k_proj,3.64678,0.01000,0.758
|
|
7,self_attn.v_proj,3.37626,0.01000,0.758
|
|
7,self_attn.q_proj,6.33875,0.01000,0.761
|
|
7,self_attn.o_proj,1.19201,0.01000,0.608
|
|
7,mlp.up_proj,9.08091,0.01000,0.777
|
|
7,mlp.gate_proj,9.16898,0.01000,0.773
|
|
7,mlp.down_proj,0.12787,0.01000,3.235
|
|
8,self_attn.k_proj,2.76998,0.01000,0.763
|
|
8,self_attn.v_proj,2.57230,0.01000,0.757
|
|
8,self_attn.q_proj,3.70224,0.01000,0.758
|
|
8,self_attn.o_proj,0.43583,0.01000,0.608
|
|
8,mlp.up_proj,7.05781,0.01000,0.771
|
|
8,mlp.gate_proj,7.07004,0.01000,0.769
|
|
8,mlp.down_proj,0.12891,0.01000,3.226
|
|
9,self_attn.k_proj,5.24076,0.01000,0.760
|
|
9,self_attn.v_proj,4.81714,0.01000,0.765
|
|
9,self_attn.q_proj,1.28618,0.01000,0.761
|
|
9,self_attn.o_proj,0.43630,0.01000,0.605
|
|
9,mlp.up_proj,4.60663,0.01000,0.775
|
|
9,mlp.gate_proj,4.60346,0.01000,0.769
|
|
9,mlp.down_proj,0.07520,0.01000,3.231
|
|
10,self_attn.k_proj,1.50184,0.01000,0.758
|
|
10,self_attn.v_proj,1.45593,0.01000,0.762
|
|
10,self_attn.q_proj,1.89232,0.01000,0.757
|
|
10,self_attn.o_proj,0.19516,0.01000,0.605
|
|
10,mlp.up_proj,4.09116,0.01000,0.770
|
|
10,mlp.gate_proj,4.13186,0.01000,0.768
|
|
10,mlp.down_proj,0.06140,0.01000,3.245
|
|
11,self_attn.k_proj,3.61625,0.01000,0.762
|
|
11,self_attn.v_proj,2.01000,0.01000,0.757
|
|
11,self_attn.q_proj,0.53930,0.01000,0.766
|
|
11,self_attn.o_proj,0.53488,0.01000,0.605
|
|
11,mlp.up_proj,5.95990,0.01000,0.775
|
|
11,mlp.gate_proj,6.01873,0.01000,0.771
|
|
11,mlp.down_proj,1.49569,0.01000,3.277
|
|
12,self_attn.k_proj,2.09444,0.01000,0.772
|
|
12,self_attn.v_proj,1.75990,0.01000,0.764
|
|
12,self_attn.q_proj,0.98691,0.01000,0.772
|
|
12,self_attn.o_proj,0.32763,0.01000,0.611
|
|
12,mlp.up_proj,2.53169,0.01000,0.784
|
|
12,mlp.gate_proj,2.49588,0.01000,0.783
|
|
12,mlp.down_proj,0.02076,0.01000,3.223
|
|
13,self_attn.k_proj,3.88221,0.01000,0.765
|
|
13,self_attn.v_proj,3.63538,0.01000,0.755
|
|
13,self_attn.q_proj,0.56800,0.01000,0.764
|
|
13,self_attn.o_proj,0.46188,0.01000,0.604
|
|
13,mlp.up_proj,2.62719,0.01000,0.773
|
|
13,mlp.gate_proj,2.61783,0.01000,0.773
|
|
13,mlp.down_proj,0.01987,0.01000,3.300
|
|
14,self_attn.k_proj,1.91174,0.01000,0.778
|
|
14,self_attn.v_proj,1.67628,0.01000,0.773
|
|
14,self_attn.q_proj,0.47230,0.01000,0.768
|
|
14,self_attn.o_proj,0.22776,0.01000,0.621
|
|
14,mlp.up_proj,2.01387,0.01000,0.778
|
|
14,mlp.gate_proj,1.99085,0.01000,0.781
|
|
14,mlp.down_proj,0.00910,0.01000,3.318
|
|
15,self_attn.k_proj,1.71465,0.01000,0.776
|
|
15,self_attn.v_proj,1.51512,0.01000,0.775
|
|
15,self_attn.q_proj,0.28649,0.01000,0.784
|
|
15,self_attn.o_proj,0.16413,0.01000,0.622
|
|
15,mlp.up_proj,4.75803,0.01000,0.795
|
|
15,mlp.gate_proj,4.92565,0.01000,0.793
|
|
15,mlp.down_proj,0.02030,0.01000,3.306
|
|
16,self_attn.k_proj,1.73286,0.01000,0.779
|
|
16,self_attn.v_proj,1.52700,0.01000,0.776
|
|
16,self_attn.q_proj,0.91500,0.01000,0.777
|
|
16,self_attn.o_proj,0.11427,0.01000,0.619
|
|
16,mlp.up_proj,3.70094,0.01000,0.783
|
|
16,mlp.gate_proj,3.71431,0.01000,0.775
|
|
16,mlp.down_proj,0.04519,0.01000,3.253
|
|
17,self_attn.k_proj,0.43938,0.01000,0.762
|
|
17,self_attn.v_proj,0.35879,0.01000,0.763
|
|
17,self_attn.q_proj,0.65869,0.01000,0.765
|
|
17,self_attn.o_proj,0.04037,0.01000,0.611
|
|
17,mlp.up_proj,3.58469,0.01000,0.777
|
|
17,mlp.gate_proj,3.66276,0.01000,0.770
|
|
17,mlp.down_proj,0.02796,0.01000,3.257
|
|
18,self_attn.k_proj,3.42578,0.01000,0.767
|
|
18,self_attn.v_proj,3.09306,0.01000,0.761
|
|
18,self_attn.q_proj,2.25221,0.01000,0.778
|
|
18,self_attn.o_proj,0.24882,0.01000,0.610
|
|
18,mlp.up_proj,4.09926,0.01000,0.779
|
|
18,mlp.gate_proj,4.20446,0.01000,0.773
|
|
18,mlp.down_proj,0.03055,0.01000,3.236
|
|
19,self_attn.k_proj,2.29446,0.01000,0.761
|
|
19,self_attn.v_proj,1.46921,0.01000,0.762
|
|
19,self_attn.q_proj,2.12650,0.01000,0.761
|
|
19,self_attn.o_proj,0.10793,0.01000,0.607
|
|
19,mlp.up_proj,3.87133,0.01000,0.774
|
|
19,mlp.gate_proj,4.02278,0.01000,0.771
|
|
19,mlp.down_proj,0.02028,0.01000,3.260
|
|
20,self_attn.k_proj,6.02629,0.01000,0.766
|
|
20,self_attn.v_proj,5.54468,0.01000,0.758
|
|
20,self_attn.q_proj,1.53195,0.01000,0.763
|
|
20,self_attn.o_proj,0.51680,0.01000,0.612
|
|
20,mlp.up_proj,3.97480,0.01000,0.775
|
|
20,mlp.gate_proj,4.07580,0.01000,0.778
|
|
20,mlp.down_proj,0.02892,0.01000,3.246
|
|
21,self_attn.k_proj,5.52127,0.01000,0.768
|
|
21,self_attn.v_proj,5.55817,0.01000,0.766
|
|
21,self_attn.q_proj,2.16732,0.01000,0.779
|
|
21,self_attn.o_proj,0.71680,0.01000,0.611
|
|
21,mlp.up_proj,5.24819,0.01000,0.785
|
|
21,mlp.gate_proj,5.41273,0.01000,0.785
|
|
21,mlp.down_proj,0.04581,0.01000,3.246
|
|
22,self_attn.k_proj,5.04561,0.01000,0.764
|
|
22,self_attn.v_proj,4.48255,0.01000,0.761
|
|
22,self_attn.q_proj,2.35098,0.01000,0.762
|
|
22,self_attn.o_proj,0.48656,0.01000,0.606
|
|
22,mlp.up_proj,6.14334,0.01000,0.778
|
|
22,mlp.gate_proj,6.36109,0.01000,0.772
|
|
22,mlp.down_proj,0.08612,0.01000,3.247
|
|
23,self_attn.k_proj,4.16688,0.01000,0.767
|
|
23,self_attn.v_proj,4.31470,0.01000,0.766
|
|
23,self_attn.q_proj,0.69882,0.01000,0.763
|
|
23,self_attn.o_proj,0.37936,0.01000,0.613
|
|
23,mlp.up_proj,8.11542,0.01000,0.780
|
|
23,mlp.gate_proj,8.28101,0.01000,0.775
|
|
23,mlp.down_proj,0.09309,0.01000,3.265
|
|
24,self_attn.k_proj,8.86272,0.01000,0.761
|
|
24,self_attn.v_proj,8.50640,0.01000,0.760
|
|
24,self_attn.q_proj,6.60116,0.01000,0.762
|
|
24,self_attn.o_proj,0.78601,0.01000,0.612
|
|
24,mlp.up_proj,8.48724,0.01000,0.778
|
|
24,mlp.gate_proj,8.67515,0.01000,0.772
|
|
24,mlp.down_proj,0.05045,0.01000,3.243
|
|
25,self_attn.k_proj,20.85596,0.01000,0.763
|
|
25,self_attn.v_proj,20.31687,0.01000,0.760
|
|
25,self_attn.q_proj,4.40460,0.01000,0.765
|
|
25,self_attn.o_proj,0.96945,0.01000,0.619
|
|
25,mlp.up_proj,8.51875,0.01000,0.793
|
|
25,mlp.gate_proj,8.63196,0.01000,0.790
|
|
25,mlp.down_proj,0.06100,0.01000,3.293
|
|
26,self_attn.k_proj,3.44908,0.01000,0.776
|
|
26,self_attn.v_proj,3.70904,0.01000,0.776
|
|
26,self_attn.q_proj,5.38957,0.01000,0.776
|
|
26,self_attn.o_proj,0.09136,0.01000,0.617
|
|
26,mlp.up_proj,7.22075,0.01000,0.787
|
|
26,mlp.gate_proj,7.31307,0.01000,0.788
|
|
26,mlp.down_proj,0.03320,0.01000,3.299
|
|
27,self_attn.k_proj,3.16697,0.01000,0.778
|
|
27,self_attn.v_proj,2.71902,0.01000,0.772
|
|
27,self_attn.q_proj,6.13490,0.01000,0.776
|
|
27,self_attn.o_proj,0.42601,0.01000,0.617
|
|
27,mlp.up_proj,6.95249,0.01000,0.790
|
|
27,mlp.gate_proj,7.11151,0.01000,0.789
|
|
27,mlp.down_proj,0.10148,0.01000,3.296
|
|
28,self_attn.k_proj,5.35555,0.01000,0.774
|
|
28,self_attn.v_proj,5.28846,0.01000,0.774
|
|
28,self_attn.q_proj,7.92698,0.01000,0.780
|
|
28,self_attn.o_proj,0.21795,0.01000,0.616
|
|
28,mlp.up_proj,4.31994,0.01000,0.790
|
|
28,mlp.gate_proj,4.40171,0.01000,0.777
|
|
28,mlp.down_proj,0.03607,0.01000,3.242
|
|
29,self_attn.k_proj,1.51074,0.01000,0.767
|
|
29,self_attn.v_proj,2.13929,0.01000,0.761
|
|
29,self_attn.q_proj,1.33246,0.01000,0.762
|
|
29,self_attn.o_proj,0.01362,0.01000,0.621
|
|
29,mlp.up_proj,2.46330,0.01000,0.779
|
|
29,mlp.gate_proj,2.51679,0.01000,0.771
|
|
29,mlp.down_proj,0.01289,0.01000,3.285
|
|
30,self_attn.k_proj,6.86594,0.01000,0.774
|
|
30,self_attn.v_proj,7.52277,0.01000,0.772
|
|
30,self_attn.q_proj,0.92430,0.01000,0.779
|
|
30,self_attn.o_proj,0.15717,0.01000,0.618
|
|
30,mlp.up_proj,5.04547,0.01000,0.785
|
|
30,mlp.gate_proj,5.15212,0.01000,0.782
|
|
30,mlp.down_proj,0.04664,0.01000,3.287
|
|
31,self_attn.k_proj,25.90375,0.01000,0.775
|
|
31,self_attn.v_proj,20.06681,0.01000,0.774
|
|
31,self_attn.q_proj,7.96819,0.01000,0.775
|
|
31,self_attn.o_proj,3.03762,0.01000,0.620
|
|
31,mlp.up_proj,8.97430,0.01000,0.789
|
|
31,mlp.gate_proj,9.35650,0.01000,0.788
|
|
31,mlp.down_proj,0.20598,0.01000,3.297
|
|
32,self_attn.k_proj,2.33364,0.01000,0.776
|
|
32,self_attn.v_proj,2.47755,0.01000,0.776
|
|
32,self_attn.q_proj,3.65308,0.01000,0.773
|
|
32,self_attn.o_proj,0.12603,0.01000,0.618
|
|
32,mlp.up_proj,7.92819,0.01000,0.788
|
|
32,mlp.gate_proj,8.39347,0.01000,0.783
|
|
32,mlp.down_proj,0.07191,0.01000,3.293
|
|
33,self_attn.k_proj,3.03554,0.01000,0.774
|
|
33,self_attn.v_proj,3.00391,0.01000,0.773
|
|
33,self_attn.q_proj,4.58165,0.01000,0.774
|
|
33,self_attn.o_proj,0.56861,0.01000,0.623
|
|
33,mlp.up_proj,13.49779,0.01000,0.789
|
|
33,mlp.gate_proj,13.66948,0.01000,0.787
|
|
33,mlp.down_proj,0.34180,0.01000,3.298
|
|
|