File size: 7,090 Bytes
d623dc8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
layer,module,loss,damp,time
0,self_attn.k_proj,0.92654,0.05000,0.383
0,self_attn.v_proj,0.01888,0.05000,0.240
0,self_attn.q_proj,5.94556,0.05000,0.247
0,self_attn.o_proj,0.00328,0.05000,0.243
0,mlp.up_proj,83.26855,0.05000,0.262
0,mlp.gate_proj,136.41730,0.05000,0.263
0,mlp.down_proj,1.34092,0.05000,1.380
1,self_attn.k_proj,8.95209,0.05000,0.241
1,self_attn.v_proj,0.85154,0.05000,0.238
1,self_attn.q_proj,31.03757,0.05000,0.245
1,self_attn.o_proj,0.58207,0.05000,0.239
1,mlp.up_proj,95.90676,0.05000,0.259
1,mlp.gate_proj,183.64766,0.05000,0.261
1,mlp.down_proj,1.14676,0.05000,1.345
2,self_attn.k_proj,17.36003,0.05000,0.242
2,self_attn.v_proj,2.11829,0.05000,0.246
2,self_attn.q_proj,59.42081,0.05000,0.248
2,self_attn.o_proj,0.41101,0.05000,0.252
2,mlp.up_proj,138.37152,0.05000,0.267
2,mlp.gate_proj,258.27576,0.05000,0.265
2,mlp.down_proj,87.07992,0.05000,1.390
3,self_attn.k_proj,21.04375,0.05000,0.240
3,self_attn.v_proj,4.92936,0.05000,0.245
3,self_attn.q_proj,83.55756,0.05000,0.250
3,self_attn.o_proj,0.64188,0.05000,0.250
3,mlp.up_proj,334.65601,0.05000,0.267
3,mlp.gate_proj,592.50232,0.05000,0.276
3,mlp.down_proj,152.53775,0.05000,1.373
4,self_attn.k_proj,12.77439,0.05000,0.239
4,self_attn.v_proj,5.69861,0.05000,0.240
4,self_attn.q_proj,61.66964,0.05000,0.244
4,self_attn.o_proj,1.54178,0.05000,0.243
4,mlp.up_proj,202.40878,0.05000,0.260
4,mlp.gate_proj,317.82367,0.05000,0.263
4,mlp.down_proj,2.41736,0.05000,1.319
5,self_attn.k_proj,14.18274,0.05000,0.238
5,self_attn.v_proj,6.86500,0.05000,0.241
5,self_attn.q_proj,69.48232,0.05000,0.253
5,self_attn.o_proj,0.91597,0.05000,0.254
5,mlp.up_proj,250.59880,0.05000,0.259
5,mlp.gate_proj,503.84485,0.05000,0.279
5,mlp.down_proj,2.38952,0.05000,1.385
6,self_attn.k_proj,13.24366,0.05000,0.249
6,self_attn.v_proj,3.92612,0.05000,0.244
6,self_attn.q_proj,57.82330,0.05000,0.256
6,self_attn.o_proj,0.82199,0.05000,0.248
6,mlp.up_proj,202.01077,0.05000,0.260
6,mlp.gate_proj,291.08887,0.05000,0.263
6,mlp.down_proj,2.34200,0.05000,1.317
7,self_attn.k_proj,20.47707,0.05000,0.236
7,self_attn.v_proj,6.82208,0.05000,0.244
7,self_attn.q_proj,83.89909,0.05000,0.245
7,self_attn.o_proj,1.38920,0.05000,0.239
7,mlp.up_proj,215.59988,0.05000,0.260
7,mlp.gate_proj,279.67908,0.05000,0.263
7,mlp.down_proj,2.72322,0.05000,1.318
8,self_attn.k_proj,15.35229,0.05000,0.240
8,self_attn.v_proj,5.31779,0.05000,0.242
8,self_attn.q_proj,72.20273,0.05000,0.243
8,self_attn.o_proj,2.27721,0.05000,0.250
8,mlp.up_proj,190.38971,0.05000,0.262
8,mlp.gate_proj,251.40579,0.05000,0.269
8,mlp.down_proj,1.84644,0.05000,1.402
9,self_attn.k_proj,46.89391,0.05000,0.242
9,self_attn.v_proj,12.24958,0.05000,0.245
9,self_attn.q_proj,185.18671,0.05000,0.245
9,self_attn.o_proj,1.13563,0.05000,0.239
9,mlp.up_proj,186.08925,0.05000,0.258
9,mlp.gate_proj,219.94760,0.05000,0.280
9,mlp.down_proj,1.89974,0.05000,1.314
10,self_attn.k_proj,12.25381,0.05000,0.236
10,self_attn.v_proj,8.53600,0.05000,0.240
10,self_attn.q_proj,61.72304,0.05000,0.244
10,self_attn.o_proj,2.15923,0.05000,0.244
10,mlp.up_proj,153.92357,0.05000,0.263
10,mlp.gate_proj,200.48236,0.05000,0.261
10,mlp.down_proj,1.46866,0.05000,1.325
11,self_attn.k_proj,47.32881,0.05000,0.236
11,self_attn.v_proj,12.32052,0.05000,0.236
11,self_attn.q_proj,172.02649,0.05000,0.241
11,self_attn.o_proj,0.99634,0.05000,0.240
11,mlp.up_proj,166.91438,0.05000,0.258
11,mlp.gate_proj,183.99411,0.05000,0.271
11,mlp.down_proj,2.20383,0.05000,1.308
12,self_attn.k_proj,10.70629,0.05000,0.234
12,self_attn.v_proj,6.82535,0.05000,0.237
12,self_attn.q_proj,58.90049,0.05000,0.240
12,self_attn.o_proj,2.06957,0.05000,0.240
12,mlp.up_proj,151.14467,0.05000,0.259
12,mlp.gate_proj,168.46320,0.05000,0.273
12,mlp.down_proj,1.57911,0.05000,1.320
13,self_attn.k_proj,20.42959,0.05000,0.237
13,self_attn.v_proj,8.33975,0.05000,0.237
13,self_attn.q_proj,100.85551,0.05000,0.243
13,self_attn.o_proj,1.29940,0.05000,0.243
13,mlp.up_proj,167.68123,0.05000,0.257
13,mlp.gate_proj,170.36960,0.05000,0.267
13,mlp.down_proj,1.88119,0.05000,1.320
14,self_attn.k_proj,12.73074,0.05000,0.240
14,self_attn.v_proj,11.76164,0.05000,0.237
14,self_attn.q_proj,77.89767,0.05000,0.240
14,self_attn.o_proj,3.52199,0.05000,0.241
14,mlp.up_proj,163.05870,0.05000,0.254
14,mlp.gate_proj,184.55475,0.05000,0.260
14,mlp.down_proj,2.35992,0.05000,1.309
15,self_attn.k_proj,13.67384,0.05000,0.233
15,self_attn.v_proj,9.17948,0.05000,0.236
15,self_attn.q_proj,67.20424,0.05000,0.241
15,self_attn.o_proj,2.04910,0.05000,0.239
15,mlp.up_proj,210.13235,0.05000,0.274
15,mlp.gate_proj,220.19116,0.05000,0.269
15,mlp.down_proj,3.57103,0.05000,1.396
16,self_attn.k_proj,29.70275,0.05000,0.244
16,self_attn.v_proj,24.40463,0.05000,0.251
16,self_attn.q_proj,166.54938,0.05000,0.241
16,self_attn.o_proj,1.16431,0.05000,0.251
16,mlp.up_proj,267.70422,0.05000,0.272
16,mlp.gate_proj,344.47858,0.05000,0.266
16,mlp.down_proj,7.87296,0.05000,1.311
17,self_attn.k_proj,15.50768,0.05000,0.233
17,self_attn.v_proj,14.58982,0.05000,0.236
17,self_attn.q_proj,101.04700,0.05000,0.241
17,self_attn.o_proj,1.79011,0.05000,0.240
17,mlp.up_proj,316.87897,0.05000,0.268
17,mlp.gate_proj,487.06854,0.05000,0.274
17,mlp.down_proj,5.82991,0.05000,1.393
18,self_attn.k_proj,16.92690,0.05000,0.250
18,self_attn.v_proj,14.79226,0.05000,0.245
18,self_attn.q_proj,90.39028,0.05000,0.245
18,self_attn.o_proj,2.17428,0.05000,0.245
18,mlp.up_proj,308.24667,0.05000,0.257
18,mlp.gate_proj,386.23010,0.05000,0.265
18,mlp.down_proj,5.66360,0.05000,1.328
19,self_attn.k_proj,15.91953,0.05000,0.239
19,self_attn.v_proj,15.05818,0.05000,0.239
19,self_attn.q_proj,97.57352,0.05000,0.242
19,self_attn.o_proj,2.65458,0.05000,0.240
19,mlp.up_proj,457.87988,0.05000,0.259
19,mlp.gate_proj,545.14697,0.05000,0.265
19,mlp.down_proj,13.83433,0.05000,1.321
20,self_attn.k_proj,21.35356,0.05000,0.237
20,self_attn.v_proj,44.00055,0.05000,0.240
20,self_attn.q_proj,143.75569,0.05000,0.246
20,self_attn.o_proj,5.11928,0.05000,0.246
20,mlp.up_proj,495.64117,0.05000,0.258
20,mlp.gate_proj,540.19043,0.05000,0.268
20,mlp.down_proj,19.63391,0.05000,1.315
21,self_attn.k_proj,23.84112,0.05000,0.238
21,self_attn.v_proj,72.92213,0.05000,0.239
21,self_attn.q_proj,177.69803,0.05000,0.242
21,self_attn.o_proj,12.85544,0.05000,0.241
21,mlp.up_proj,554.14130,0.05000,0.257
21,mlp.gate_proj,570.48572,0.05000,0.268
21,mlp.down_proj,196.02072,0.05000,1.320
22,self_attn.k_proj,22.17667,0.05000,0.237
22,self_attn.v_proj,66.65771,0.05000,0.239
22,self_attn.q_proj,167.72662,0.05000,0.245
22,self_attn.o_proj,2.24238,0.05000,0.242
22,mlp.up_proj,406.67615,0.05000,0.259
22,mlp.gate_proj,387.07877,0.05000,0.265
22,mlp.down_proj,31.63613,0.05000,1.329
23,self_attn.k_proj,27.19038,0.05000,0.237
23,self_attn.v_proj,55.59654,0.05000,0.240
23,self_attn.q_proj,218.93060,0.05000,0.243
23,self_attn.o_proj,13.96109,0.05000,0.238
23,mlp.up_proj,507.27164,0.05000,0.255
23,mlp.gate_proj,520.63934,0.05000,0.262
23,mlp.down_proj,124.49292,0.05000,1.328