File size: 12,583 Bytes
0b7ff43
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00070515,0.01000,1.385
0,self_attn.v_proj,0.00059307,0.01000,1.121
0,self_attn.q_proj,0.00258521,0.01000,1.172
0,self_attn.o_proj,0.01955252,0.01000,1.172
0,mlp.up_proj,0.14081547,0.01000,1.232
0,mlp.gate_proj,0.21270670,0.01000,1.184
0,mlp.down_proj,0.10341728,0.01000,5.008
1,self_attn.k_proj,0.00179484,0.01000,1.179
1,self_attn.v_proj,0.00185646,0.01000,1.124
1,self_attn.q_proj,0.00755967,0.01000,1.148
1,self_attn.o_proj,0.01750864,0.01000,1.186
1,mlp.up_proj,1.93339133,0.01000,1.241
1,mlp.gate_proj,6.46621895,0.01000,1.194
1,mlp.down_proj,0.24397323,0.01000,5.021
2,self_attn.k_proj,0.00402845,0.01000,1.159
2,self_attn.v_proj,0.00421844,0.01000,1.105
2,self_attn.q_proj,0.01554210,0.01000,1.128
2,self_attn.o_proj,0.03608973,0.01000,1.185
2,mlp.up_proj,4.04899502,0.01000,1.237
2,mlp.gate_proj,8.89684391,0.01000,1.193
2,mlp.down_proj,0.22869286,0.01000,5.269
3,self_attn.k_proj,0.00834207,0.01000,1.177
3,self_attn.v_proj,0.00874612,0.01000,1.128
3,self_attn.q_proj,0.03258161,0.01000,1.150
3,self_attn.o_proj,0.04409736,0.01000,1.186
3,mlp.up_proj,6.68514776,0.01000,1.248
3,mlp.gate_proj,15.11703968,0.01000,1.198
3,mlp.down_proj,0.36655888,0.01000,5.079
4,self_attn.k_proj,0.01444592,0.01000,1.173
4,self_attn.v_proj,0.01500741,0.01000,1.124
4,self_attn.q_proj,0.05909440,0.01000,1.146
4,self_attn.o_proj,0.06205442,0.01000,1.186
4,mlp.up_proj,13.67866325,0.01000,1.243
4,mlp.gate_proj,23.40497398,0.01000,1.194
4,mlp.down_proj,0.41648334,0.01000,5.070
5,self_attn.k_proj,0.01607831,0.01000,1.166
5,self_attn.v_proj,0.01557913,0.01000,1.172
5,self_attn.q_proj,0.06674744,0.01000,1.141
5,self_attn.o_proj,0.07189713,0.01000,1.191
5,mlp.up_proj,10.08458900,0.01000,1.240
5,mlp.gate_proj,25.65925598,0.01000,1.196
5,mlp.down_proj,0.72814405,0.01000,5.078
6,self_attn.k_proj,0.02797525,0.01000,1.180
6,self_attn.v_proj,0.02999315,0.01000,1.124
6,self_attn.q_proj,0.11771373,0.01000,1.149
6,self_attn.o_proj,0.10042808,0.01000,1.207
6,mlp.up_proj,22.71648407,0.01000,1.237
6,mlp.gate_proj,43.64604950,0.01000,1.202
6,mlp.down_proj,55.64929581,0.01000,5.161
7,self_attn.k_proj,0.11195987,0.01000,1.207
7,self_attn.v_proj,0.12252167,0.01000,1.138
7,self_attn.q_proj,0.49221504,0.01000,1.171
7,self_attn.o_proj,0.22399020,0.01000,1.270
7,mlp.up_proj,19.27217484,0.01000,1.261
7,mlp.gate_proj,40.91525650,0.01000,1.273
7,mlp.down_proj,1.07534313,0.01000,5.317
8,self_attn.k_proj,0.12188863,0.01000,1.208
8,self_attn.v_proj,0.14043301,0.01000,1.150
8,self_attn.q_proj,0.52052939,0.01000,1.178
8,self_attn.o_proj,0.24562880,0.01000,1.208
8,mlp.up_proj,7.53962708,0.01000,1.258
8,mlp.gate_proj,13.18854618,0.01000,1.213
8,mlp.down_proj,1.41018748,0.01000,5.144
9,self_attn.k_proj,0.08431721,0.01000,1.234
9,self_attn.v_proj,0.07946551,0.01000,1.142
9,self_attn.q_proj,0.35178173,0.01000,1.163
9,self_attn.o_proj,0.21273188,0.01000,1.203
9,mlp.up_proj,7.51564360,0.01000,1.257
9,mlp.gate_proj,8.31024075,0.01000,1.209
9,mlp.down_proj,1.97027135,0.01000,5.389
10,self_attn.k_proj,0.13970166,0.01000,1.189
10,self_attn.v_proj,0.15342611,0.01000,1.234
10,self_attn.q_proj,0.60267645,0.01000,1.171
10,self_attn.o_proj,0.36029112,0.01000,1.272
10,mlp.up_proj,8.76702881,0.01000,1.317
10,mlp.gate_proj,9.45533562,0.01000,1.285
10,mlp.down_proj,1.95001364,0.01000,5.389
11,self_attn.k_proj,0.22548521,0.01000,1.192
11,self_attn.v_proj,0.23918489,0.01000,1.141
11,self_attn.q_proj,0.96112633,0.01000,1.161
11,self_attn.o_proj,0.64858180,0.01000,1.272
11,mlp.up_proj,10.80723763,0.01000,1.253
11,mlp.gate_proj,11.55856419,0.01000,1.207
11,mlp.down_proj,2.57149935,0.01000,5.577
12,self_attn.k_proj,0.19354048,0.01000,1.188
12,self_attn.v_proj,0.19336683,0.01000,1.143
12,self_attn.q_proj,0.81618583,0.01000,1.180
12,self_attn.o_proj,0.62866342,0.01000,1.198
12,mlp.up_proj,12.84583282,0.01000,1.271
12,mlp.gate_proj,13.82784271,0.01000,1.221
12,mlp.down_proj,3.34642506,0.01000,5.156
13,self_attn.k_proj,0.42784294,0.01000,1.198
13,self_attn.v_proj,0.46224689,0.01000,1.143
13,self_attn.q_proj,1.86821342,0.01000,1.167
13,self_attn.o_proj,1.11543632,0.01000,1.197
13,mlp.up_proj,14.57806587,0.01000,1.250
13,mlp.gate_proj,16.80974579,0.01000,1.202
13,mlp.down_proj,3.90047622,0.01000,5.149
14,self_attn.k_proj,0.30829912,0.01000,1.198
14,self_attn.v_proj,0.32090122,0.01000,1.148
14,self_attn.q_proj,1.31513786,0.01000,1.188
14,self_attn.o_proj,1.03302169,0.01000,1.200
14,mlp.up_proj,14.98736763,0.01000,1.282
14,mlp.gate_proj,16.62957382,0.01000,1.281
14,mlp.down_proj,4.07754374,0.01000,5.408
15,self_attn.k_proj,0.29759282,0.01000,1.200
15,self_attn.v_proj,0.29929948,0.01000,1.155
15,self_attn.q_proj,1.26697755,0.01000,1.172
15,self_attn.o_proj,0.93979216,0.01000,1.206
15,mlp.up_proj,15.57353783,0.01000,1.258
15,mlp.gate_proj,16.22858429,0.01000,1.210
15,mlp.down_proj,4.35530853,0.01000,5.379
16,self_attn.k_proj,0.37539023,0.01000,1.211
16,self_attn.v_proj,0.40242690,0.01000,1.188
16,self_attn.q_proj,1.57348514,0.01000,1.164
16,self_attn.o_proj,1.27471220,0.01000,1.221
16,mlp.up_proj,14.90924168,0.01000,1.265
16,mlp.gate_proj,14.57688999,0.01000,1.254
16,mlp.down_proj,4.53259277,0.01000,5.613
17,self_attn.k_proj,0.39300671,0.01000,1.238
17,self_attn.v_proj,0.40721723,0.01000,1.254
17,self_attn.q_proj,1.74801767,0.01000,1.281
17,self_attn.o_proj,1.37048018,0.01000,1.276
17,mlp.up_proj,16.27043724,0.01000,1.324
17,mlp.gate_proj,15.69502831,0.01000,1.274
17,mlp.down_proj,4.69274473,0.01000,5.326
18,self_attn.k_proj,0.56768882,0.01000,1.254
18,self_attn.v_proj,0.58766353,0.01000,1.206
18,self_attn.q_proj,2.51605034,0.01000,1.226
18,self_attn.o_proj,1.34994674,0.01000,1.279
18,mlp.up_proj,17.51553345,0.01000,1.301
18,mlp.gate_proj,16.32071114,0.01000,1.243
18,mlp.down_proj,5.31907988,0.01000,5.185
19,self_attn.k_proj,0.78620756,0.01000,1.265
19,self_attn.v_proj,0.81862819,0.01000,1.223
19,self_attn.q_proj,3.35753012,0.01000,1.248
19,self_attn.o_proj,1.61737394,0.01000,1.276
19,mlp.up_proj,19.24126816,0.01000,1.260
19,mlp.gate_proj,18.14963341,0.01000,1.271
19,mlp.down_proj,16.54980850,0.01000,5.439
20,self_attn.k_proj,1.43805170,0.01000,1.279
20,self_attn.v_proj,1.62246335,0.01000,1.220
20,self_attn.q_proj,6.66899490,0.01000,1.245
20,self_attn.o_proj,2.46310806,0.01000,1.201
20,mlp.up_proj,20.68938828,0.01000,1.266
20,mlp.gate_proj,19.20712280,0.01000,1.212
20,mlp.down_proj,7.44412184,0.01000,5.173
21,self_attn.k_proj,1.47485924,0.01000,1.214
21,self_attn.v_proj,1.44628322,0.01000,1.172
21,self_attn.q_proj,6.17815638,0.01000,1.199
21,self_attn.o_proj,3.53289413,0.01000,1.277
21,mlp.up_proj,22.05725479,0.01000,1.293
21,mlp.gate_proj,20.82827759,0.01000,1.230
21,mlp.down_proj,8.68605137,0.01000,5.657
22,self_attn.k_proj,1.44943690,0.01000,1.189
22,self_attn.v_proj,1.64447689,0.01000,1.138
22,self_attn.q_proj,6.54392338,0.01000,1.163
22,self_attn.o_proj,3.19042945,0.01000,1.196
22,mlp.up_proj,24.60332108,0.01000,1.252
22,mlp.gate_proj,23.00504684,0.01000,1.206
22,mlp.down_proj,9.71904182,0.01000,5.351
23,self_attn.k_proj,2.18464589,0.01000,1.190
23,self_attn.v_proj,2.59843898,0.01000,1.139
23,self_attn.q_proj,10.36781311,0.01000,1.162
23,self_attn.o_proj,2.85652900,0.01000,1.191
23,mlp.up_proj,25.49422836,0.01000,1.325
23,mlp.gate_proj,23.43290138,0.01000,1.289
23,mlp.down_proj,11.47138596,0.01000,5.225
24,self_attn.k_proj,2.77395487,0.01000,1.258
24,self_attn.v_proj,3.21030664,0.01000,1.207
24,self_attn.q_proj,13.67599678,0.01000,1.229
24,self_attn.o_proj,4.96184969,0.01000,1.273
24,mlp.up_proj,27.81478119,0.01000,1.267
24,mlp.gate_proj,26.07052231,0.01000,1.219
24,mlp.down_proj,12.45972443,0.01000,5.404
25,self_attn.k_proj,2.77749777,0.01000,1.225
25,self_attn.v_proj,3.10713243,0.01000,1.174
25,self_attn.q_proj,12.99405098,0.01000,1.177
25,self_attn.o_proj,4.33352947,0.01000,1.236
25,mlp.up_proj,30.71481323,0.01000,1.303
25,mlp.gate_proj,29.03659439,0.01000,1.212
25,mlp.down_proj,15.96378517,0.01000,5.203
26,self_attn.k_proj,3.00112486,0.01000,1.196
26,self_attn.v_proj,3.52014399,0.01000,1.144
26,self_attn.q_proj,14.48973846,0.01000,1.170
26,self_attn.o_proj,4.95573711,0.01000,1.204
26,mlp.up_proj,34.63649368,0.01000,1.258
26,mlp.gate_proj,33.71157837,0.01000,1.213
26,mlp.down_proj,24.53585052,0.01000,5.392
27,self_attn.k_proj,4.64402103,0.01000,1.284
27,self_attn.v_proj,5.38009834,0.01000,1.139
27,self_attn.q_proj,21.22321701,0.01000,1.161
27,self_attn.o_proj,8.20958328,0.01000,1.190
27,mlp.up_proj,42.48213577,0.01000,1.255
27,mlp.gate_proj,41.43994904,0.01000,1.205
27,mlp.down_proj,35.94324112,0.01000,5.184
28,self_attn.k_proj,7.01647139,0.01000,1.188
28,self_attn.v_proj,8.68221283,0.01000,1.138
28,self_attn.q_proj,33.62464905,0.01000,1.161
28,self_attn.o_proj,10.86140060,0.01000,1.195
28,mlp.up_proj,53.62960052,0.01000,1.254
28,mlp.gate_proj,51.62405777,0.01000,1.208
28,mlp.down_proj,46.18000793,0.01000,5.157
29,self_attn.k_proj,10.72468376,0.01000,1.193
29,self_attn.v_proj,11.93986320,0.01000,1.186
29,self_attn.q_proj,49.06664658,0.01000,1.157
29,self_attn.o_proj,9.47833252,0.01000,1.215
29,mlp.up_proj,60.01675797,0.01000,1.259
29,mlp.gate_proj,57.49778748,0.01000,1.211
29,mlp.down_proj,66.30590820,0.01000,5.373
30,self_attn.k_proj,16.15894699,0.01000,1.194
30,self_attn.v_proj,20.22811890,0.01000,1.148
30,self_attn.q_proj,72.88484192,0.01000,1.168
30,self_attn.o_proj,17.97172165,0.01000,1.201
30,mlp.up_proj,77.35546875,0.01000,1.258
30,mlp.gate_proj,73.98342133,0.01000,1.215
30,mlp.down_proj,80.41363525,0.01000,5.146
31,self_attn.k_proj,16.20863724,0.01000,1.197
31,self_attn.v_proj,17.44694710,0.01000,1.148
31,self_attn.q_proj,71.93412018,0.01000,1.170
31,self_attn.o_proj,15.64772701,0.01000,1.271
31,mlp.up_proj,84.93713379,0.01000,1.329
31,mlp.gate_proj,79.64702606,0.01000,1.266
31,mlp.down_proj,102.10330963,0.01000,5.332
32,self_attn.k_proj,30.03628540,0.01000,1.195
32,self_attn.v_proj,39.24974823,0.01000,1.158
32,self_attn.q_proj,132.09585571,0.01000,1.170
32,self_attn.o_proj,16.91402435,0.01000,1.204
32,mlp.up_proj,97.01721954,0.01000,1.331
32,mlp.gate_proj,89.70504761,0.01000,1.293
32,mlp.down_proj,119.89739990,0.01000,5.660
33,self_attn.k_proj,37.31489944,0.01000,1.247
33,self_attn.v_proj,54.59365082,0.01000,1.219
33,self_attn.q_proj,164.40927124,0.01000,1.245
33,self_attn.o_proj,19.79536247,0.01000,1.270
33,mlp.up_proj,104.77709198,0.01000,1.325
33,mlp.gate_proj,94.75755310,0.01000,1.279
33,mlp.down_proj,140.76945496,0.01000,5.166
34,self_attn.k_proj,67.91184998,0.01000,1.190
34,self_attn.v_proj,88.80003357,0.01000,1.139
34,self_attn.q_proj,298.65936279,0.01000,1.165
34,self_attn.o_proj,25.28427124,0.01000,1.197
34,mlp.up_proj,118.75723267,0.01000,1.255
34,mlp.gate_proj,105.32444000,0.01000,1.219
34,mlp.down_proj,166.93191528,0.01000,5.414
35,self_attn.k_proj,88.77953339,0.01000,1.293
35,self_attn.v_proj,130.98645020,0.01000,1.221
35,self_attn.q_proj,409.77334595,0.01000,1.170
35,self_attn.o_proj,25.57363319,0.01000,1.293
35,mlp.up_proj,128.79974365,0.01000,1.258
35,mlp.gate_proj,112.65682983,0.01000,1.212
35,mlp.down_proj,207.04046631,0.01000,5.163
36,self_attn.k_proj,83.83846283,0.01000,1.198
36,self_attn.v_proj,105.56782532,0.01000,1.146
36,self_attn.q_proj,385.79064941,0.01000,1.169
36,self_attn.o_proj,52.55107117,0.01000,1.204
36,mlp.up_proj,139.16838074,0.01000,1.259
36,mlp.gate_proj,118.08029938,0.01000,1.213
36,mlp.down_proj,276.03088379,0.01000,5.362
37,self_attn.k_proj,107.06826782,0.01000,1.199
37,self_attn.v_proj,182.47669983,0.01000,1.144
37,self_attn.q_proj,516.48419189,0.01000,1.173
37,self_attn.o_proj,67.11089325,0.01000,1.206
37,mlp.up_proj,146.49134827,0.01000,1.256
37,mlp.gate_proj,122.33524323,0.01000,1.212
37,mlp.down_proj,372.25158691,0.01000,5.430
38,self_attn.k_proj,117.78956604,0.01000,1.198
38,self_attn.v_proj,178.97363281,0.01000,1.149
38,self_attn.q_proj,535.84649658,0.01000,1.171
38,self_attn.o_proj,128.42825317,0.01000,1.201
38,mlp.up_proj,165.81509399,0.01000,1.263
38,mlp.gate_proj,146.40844727,0.01000,1.216
38,mlp.down_proj,547.92755127,0.01000,5.405
39,self_attn.k_proj,54.57062149,0.01000,1.236
39,self_attn.v_proj,73.58613586,0.01000,1.202
39,self_attn.q_proj,241.50205994,0.01000,1.173
39,self_attn.o_proj,100.98907471,0.01000,1.230
39,mlp.up_proj,214.80130005,0.01000,1.248
39,mlp.gate_proj,195.37448120,0.01000,1.197
39,mlp.down_proj,1378.51818848,0.01000,5.398