|
layer,module,loss,damp,time
|
|
0,self_attn.k_proj,0.42746,0.01000,1.298
|
|
0,self_attn.v_proj,0.00322,0.01000,1.145
|
|
0,self_attn.q_proj,0.59539,0.01000,1.194
|
|
0,self_attn.o_proj,0.00019,0.01000,1.172
|
|
0,mlp.up_proj,0.23273,0.01000,1.245
|
|
0,mlp.gate_proj,0.28538,0.01000,1.268
|
|
0,mlp.down_proj,0.00092,0.01000,4.726
|
|
1,self_attn.k_proj,0.25741,0.01000,1.185
|
|
1,self_attn.v_proj,0.00849,0.01000,1.166
|
|
1,self_attn.q_proj,0.44868,0.01000,1.207
|
|
1,self_attn.o_proj,0.00059,0.01000,1.188
|
|
1,mlp.up_proj,0.42066,0.01000,1.262
|
|
1,mlp.gate_proj,0.50823,0.01000,1.260
|
|
1,mlp.down_proj,0.05587,0.01000,4.725
|
|
2,self_attn.k_proj,1.36904,0.01000,1.138
|
|
2,self_attn.v_proj,0.04992,0.01000,1.144
|
|
2,self_attn.q_proj,1.96132,0.01000,1.158
|
|
2,self_attn.o_proj,0.00073,0.01000,1.180
|
|
2,mlp.up_proj,0.70970,0.01000,1.240
|
|
2,mlp.gate_proj,0.91449,0.01000,1.231
|
|
2,mlp.down_proj,0.00373,0.01000,4.664
|
|
3,self_attn.k_proj,1.16119,0.01000,1.121
|
|
3,self_attn.v_proj,0.09106,0.01000,1.146
|
|
3,self_attn.q_proj,1.95196,0.01000,1.143
|
|
3,self_attn.o_proj,0.00155,0.01000,1.156
|
|
3,mlp.up_proj,0.97830,0.01000,1.230
|
|
3,mlp.gate_proj,1.47659,0.01000,1.216
|
|
3,mlp.down_proj,0.00699,0.01000,4.565
|
|
4,self_attn.k_proj,1.07471,0.01000,1.120
|
|
4,self_attn.v_proj,0.08962,0.01000,1.119
|
|
4,self_attn.q_proj,1.77537,0.01000,1.156
|
|
4,self_attn.o_proj,0.00395,0.01000,1.143
|
|
4,mlp.up_proj,1.25910,0.01000,1.208
|
|
4,mlp.gate_proj,2.20183,0.01000,1.246
|
|
4,mlp.down_proj,0.01210,0.01000,4.601
|
|
5,self_attn.k_proj,1.79082,0.01000,1.146
|
|
5,self_attn.v_proj,0.08954,0.01000,1.123
|
|
5,self_attn.q_proj,2.67382,0.01000,1.144
|
|
5,self_attn.o_proj,0.00405,0.01000,1.175
|
|
5,mlp.up_proj,1.55323,0.01000,1.223
|
|
5,mlp.gate_proj,2.69463,0.01000,1.212
|
|
5,mlp.down_proj,0.01728,0.01000,4.590
|
|
6,self_attn.k_proj,1.46103,0.01000,1.112
|
|
6,self_attn.v_proj,0.10099,0.01000,1.127
|
|
6,self_attn.q_proj,2.45505,0.01000,1.134
|
|
6,self_attn.o_proj,0.00666,0.01000,1.139
|
|
6,mlp.up_proj,1.70162,0.01000,1.274
|
|
6,mlp.gate_proj,3.00450,0.01000,1.206
|
|
6,mlp.down_proj,0.02088,0.01000,4.627
|
|
7,self_attn.k_proj,1.48093,0.01000,1.116
|
|
7,self_attn.v_proj,0.10914,0.01000,1.116
|
|
7,self_attn.q_proj,2.32144,0.01000,1.132
|
|
7,self_attn.o_proj,0.00948,0.01000,1.159
|
|
7,mlp.up_proj,1.85436,0.01000,1.252
|
|
7,mlp.gate_proj,3.05631,0.01000,1.202
|
|
7,mlp.down_proj,0.02436,0.01000,4.582
|
|
8,self_attn.k_proj,1.94325,0.01000,1.125
|
|
8,self_attn.v_proj,0.14212,0.01000,1.100
|
|
8,self_attn.q_proj,2.95584,0.01000,1.139
|
|
8,self_attn.o_proj,0.01252,0.01000,1.124
|
|
8,mlp.up_proj,1.98400,0.01000,1.205
|
|
8,mlp.gate_proj,3.33098,0.01000,1.199
|
|
8,mlp.down_proj,0.02670,0.01000,4.623
|
|
9,self_attn.k_proj,1.88189,0.01000,1.144
|
|
9,self_attn.v_proj,0.20366,0.01000,1.121
|
|
9,self_attn.q_proj,2.93669,0.01000,1.155
|
|
9,self_attn.o_proj,0.01573,0.01000,1.162
|
|
9,mlp.up_proj,2.08006,0.01000,1.287
|
|
9,mlp.gate_proj,3.52270,0.01000,1.222
|
|
9,mlp.down_proj,0.02895,0.01000,4.640
|
|
10,self_attn.k_proj,2.27381,0.01000,1.121
|
|
10,self_attn.v_proj,0.15105,0.01000,1.121
|
|
10,self_attn.q_proj,3.48119,0.01000,1.148
|
|
10,self_attn.o_proj,0.01408,0.01000,1.158
|
|
10,mlp.up_proj,2.16419,0.01000,1.264
|
|
10,mlp.gate_proj,3.39999,0.01000,1.205
|
|
10,mlp.down_proj,0.03022,0.01000,4.639
|
|
11,self_attn.k_proj,2.07252,0.01000,1.139
|
|
11,self_attn.v_proj,0.16126,0.01000,1.109
|
|
11,self_attn.q_proj,3.02845,0.01000,1.154
|
|
11,self_attn.o_proj,0.01404,0.01000,1.161
|
|
11,mlp.up_proj,2.27135,0.01000,1.282
|
|
11,mlp.gate_proj,3.44862,0.01000,1.208
|
|
11,mlp.down_proj,0.03207,0.01000,4.564
|
|
12,self_attn.k_proj,1.60538,0.01000,1.117
|
|
12,self_attn.v_proj,0.19192,0.01000,1.108
|
|
12,self_attn.q_proj,2.62414,0.01000,1.129
|
|
12,self_attn.o_proj,0.01902,0.01000,1.145
|
|
12,mlp.up_proj,2.29499,0.01000,1.253
|
|
12,mlp.gate_proj,3.29678,0.01000,1.236
|
|
12,mlp.down_proj,0.03569,0.01000,4.594
|
|
13,self_attn.k_proj,2.38634,0.01000,1.111
|
|
13,self_attn.v_proj,0.20405,0.01000,1.123
|
|
13,self_attn.q_proj,3.38319,0.01000,1.160
|
|
13,self_attn.o_proj,0.02028,0.01000,1.156
|
|
13,mlp.up_proj,2.41499,0.01000,1.205
|
|
13,mlp.gate_proj,3.49100,0.01000,1.219
|
|
13,mlp.down_proj,0.04046,0.01000,4.586
|
|
14,self_attn.k_proj,2.54345,0.01000,1.118
|
|
14,self_attn.v_proj,0.21222,0.01000,1.109
|
|
14,self_attn.q_proj,3.39434,0.01000,1.137
|
|
14,self_attn.o_proj,0.02202,0.01000,1.146
|
|
14,mlp.up_proj,2.63057,0.01000,1.253
|
|
14,mlp.gate_proj,4.05357,0.01000,1.202
|
|
14,mlp.down_proj,0.05063,0.01000,4.578
|
|
15,self_attn.k_proj,2.37138,0.01000,1.122
|
|
15,self_attn.v_proj,0.26364,0.01000,1.124
|
|
15,self_attn.q_proj,4.12155,0.01000,1.128
|
|
15,self_attn.o_proj,0.02747,0.01000,1.154
|
|
15,mlp.up_proj,2.79545,0.01000,1.272
|
|
15,mlp.gate_proj,4.58567,0.01000,1.206
|
|
15,mlp.down_proj,0.06211,0.01000,4.629
|
|
16,self_attn.k_proj,2.48672,0.01000,1.118
|
|
16,self_attn.v_proj,0.23719,0.01000,1.126
|
|
16,self_attn.q_proj,3.82693,0.01000,1.153
|
|
16,self_attn.o_proj,0.02067,0.01000,1.184
|
|
16,mlp.up_proj,3.02743,0.01000,1.234
|
|
16,mlp.gate_proj,5.28880,0.01000,1.224
|
|
16,mlp.down_proj,0.06787,0.01000,4.618
|
|
17,self_attn.k_proj,2.72810,0.01000,1.133
|
|
17,self_attn.v_proj,0.26371,0.01000,1.107
|
|
17,self_attn.q_proj,4.06875,0.01000,1.143
|
|
17,self_attn.o_proj,0.01875,0.01000,1.138
|
|
17,mlp.up_proj,3.14924,0.01000,1.208
|
|
17,mlp.gate_proj,5.65233,0.01000,1.210
|
|
17,mlp.down_proj,0.07761,0.01000,4.663
|
|
18,self_attn.k_proj,3.08600,0.01000,1.108
|
|
18,self_attn.v_proj,0.26879,0.01000,1.102
|
|
18,self_attn.q_proj,4.17190,0.01000,1.138
|
|
18,self_attn.o_proj,0.01298,0.01000,1.143
|
|
18,mlp.up_proj,3.34775,0.01000,1.220
|
|
18,mlp.gate_proj,6.07418,0.01000,1.205
|
|
18,mlp.down_proj,0.07685,0.01000,4.580
|
|
19,self_attn.k_proj,2.78422,0.01000,1.106
|
|
19,self_attn.v_proj,0.29603,0.01000,1.114
|
|
19,self_attn.q_proj,4.27470,0.01000,1.138
|
|
19,self_attn.o_proj,0.01093,0.01000,1.152
|
|
19,mlp.up_proj,3.49393,0.01000,1.267
|
|
19,mlp.gate_proj,6.46843,0.01000,1.217
|
|
19,mlp.down_proj,0.08123,0.01000,4.633
|
|
20,self_attn.k_proj,3.06023,0.01000,1.128
|
|
20,self_attn.v_proj,0.31687,0.01000,1.097
|
|
20,self_attn.q_proj,4.43400,0.01000,1.137
|
|
20,self_attn.o_proj,0.01376,0.01000,1.145
|
|
20,mlp.up_proj,3.77894,0.01000,1.238
|
|
20,mlp.gate_proj,6.94192,0.01000,1.206
|
|
20,mlp.down_proj,0.08805,0.01000,4.574
|
|
21,self_attn.k_proj,3.02578,0.01000,1.123
|
|
21,self_attn.v_proj,0.34842,0.01000,1.101
|
|
21,self_attn.q_proj,4.26813,0.01000,1.130
|
|
21,self_attn.o_proj,0.01654,0.01000,1.149
|
|
21,mlp.up_proj,4.02334,0.01000,1.208
|
|
21,mlp.gate_proj,7.47360,0.01000,1.208
|
|
21,mlp.down_proj,0.10173,0.01000,4.560
|
|
22,self_attn.k_proj,3.21109,0.01000,1.107
|
|
22,self_attn.v_proj,0.40353,0.01000,1.103
|
|
22,self_attn.q_proj,4.31625,0.01000,1.148
|
|
22,self_attn.o_proj,0.01620,0.01000,1.140
|
|
22,mlp.up_proj,4.21165,0.01000,1.244
|
|
22,mlp.gate_proj,7.74982,0.01000,1.227
|
|
22,mlp.down_proj,0.10385,0.01000,4.593
|
|
23,self_attn.k_proj,3.13089,0.01000,1.121
|
|
23,self_attn.v_proj,0.44445,0.01000,1.108
|
|
23,self_attn.q_proj,4.53023,0.01000,1.142
|
|
23,self_attn.o_proj,0.01677,0.01000,1.150
|
|
23,mlp.up_proj,4.45875,0.01000,1.295
|
|
23,mlp.gate_proj,8.15389,0.01000,1.227
|
|
23,mlp.down_proj,0.11010,0.01000,4.551
|
|
24,self_attn.k_proj,3.09817,0.01000,1.117
|
|
24,self_attn.v_proj,0.56140,0.01000,1.104
|
|
24,self_attn.q_proj,4.55197,0.01000,1.138
|
|
24,self_attn.o_proj,0.01750,0.01000,1.140
|
|
24,mlp.up_proj,4.73548,0.01000,1.278
|
|
24,mlp.gate_proj,8.65579,0.01000,1.217
|
|
24,mlp.down_proj,0.11689,0.01000,4.614
|
|
25,self_attn.k_proj,2.89024,0.01000,1.112
|
|
25,self_attn.v_proj,0.58672,0.01000,1.098
|
|
25,self_attn.q_proj,4.54099,0.01000,1.139
|
|
25,self_attn.o_proj,0.01983,0.01000,1.147
|
|
25,mlp.up_proj,5.09005,0.01000,1.256
|
|
25,mlp.gate_proj,9.27115,0.01000,1.246
|
|
25,mlp.down_proj,0.13050,0.01000,4.618
|
|
26,self_attn.k_proj,3.09196,0.01000,1.126
|
|
26,self_attn.v_proj,0.55225,0.01000,1.108
|
|
26,self_attn.q_proj,4.40156,0.01000,1.133
|
|
26,self_attn.o_proj,0.02839,0.01000,1.124
|
|
26,mlp.up_proj,5.50463,0.01000,1.222
|
|
26,mlp.gate_proj,10.03537,0.01000,1.201
|
|
26,mlp.down_proj,0.14945,0.01000,4.577
|
|
27,self_attn.k_proj,3.41508,0.01000,1.113
|
|
27,self_attn.v_proj,0.81567,0.01000,1.108
|
|
27,self_attn.q_proj,4.62589,0.01000,1.135
|
|
27,self_attn.o_proj,0.03718,0.01000,1.156
|
|
27,mlp.up_proj,6.03421,0.01000,1.262
|
|
27,mlp.gate_proj,10.88744,0.01000,1.208
|
|
27,mlp.down_proj,0.17776,0.01000,4.577
|
|
28,self_attn.k_proj,2.67063,0.01000,1.113
|
|
28,self_attn.v_proj,0.71694,0.01000,1.104
|
|
28,self_attn.q_proj,4.29881,0.01000,1.164
|
|
28,self_attn.o_proj,0.05667,0.01000,1.135
|
|
28,mlp.up_proj,6.71101,0.01000,1.285
|
|
28,mlp.gate_proj,11.49661,0.01000,1.228
|
|
28,mlp.down_proj,0.23139,0.01000,4.585
|
|
29,self_attn.k_proj,2.80025,0.01000,1.106
|
|
29,self_attn.v_proj,0.89157,0.01000,1.097
|
|
29,self_attn.q_proj,4.54988,0.01000,1.133
|
|
29,self_attn.o_proj,0.05056,0.01000,1.137
|
|
29,mlp.up_proj,7.20778,0.01000,1.251
|
|
29,mlp.gate_proj,11.64608,0.01000,1.200
|
|
29,mlp.down_proj,0.31413,0.01000,4.578
|
|
30,self_attn.k_proj,2.79350,0.01000,1.114
|
|
30,self_attn.v_proj,1.19605,0.01000,1.108
|
|
30,self_attn.q_proj,4.14300,0.01000,1.136
|
|
30,self_attn.o_proj,0.09164,0.01000,1.139
|
|
30,mlp.up_proj,7.67613,0.01000,1.214
|
|
30,mlp.gate_proj,12.59885,0.01000,1.208
|
|
30,mlp.down_proj,0.48913,0.01000,4.572
|
|
31,self_attn.k_proj,2.00682,0.01000,1.122
|
|
31,self_attn.v_proj,0.74282,0.01000,1.100
|
|
31,self_attn.q_proj,3.63397,0.01000,1.148
|
|
31,self_attn.o_proj,0.16117,0.01000,1.136
|
|
31,mlp.up_proj,7.21422,0.01000,1.251
|
|
31,mlp.gate_proj,11.19762,0.01000,1.204
|
|
31,mlp.down_proj,1.27110,0.01000,4.613
|
|
|