File size: 12,584 Bytes
0ab2b87
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
layer,module,loss,damp,time
0,self_attn.k_proj,0.00070691,0.01000,1.432
0,self_attn.v_proj,0.00059318,0.01000,1.071
0,self_attn.q_proj,0.00259039,0.01000,1.131
0,self_attn.o_proj,0.01872325,0.01000,1.265
0,mlp.up_proj,0.13378978,0.01000,1.312
0,mlp.gate_proj,0.20375231,0.01000,1.255
0,mlp.down_proj,0.10015747,0.01000,5.321
1,self_attn.k_proj,0.00169902,0.01000,1.261
1,self_attn.v_proj,0.00176455,0.01000,1.207
1,self_attn.q_proj,0.00715574,0.01000,1.230
1,self_attn.o_proj,0.01774971,0.01000,1.265
1,mlp.up_proj,1.87754011,0.01000,1.298
1,mlp.gate_proj,6.26215172,0.01000,1.256
1,mlp.down_proj,0.23886812,0.01000,5.342
2,self_attn.k_proj,0.00389131,0.01000,1.255
2,self_attn.v_proj,0.00406967,0.01000,1.210
2,self_attn.q_proj,0.01501170,0.01000,1.239
2,self_attn.o_proj,0.03605750,0.01000,1.265
2,mlp.up_proj,3.97210836,0.01000,1.324
2,mlp.gate_proj,8.70841980,0.01000,1.272
2,mlp.down_proj,0.23816061,0.01000,5.355
3,self_attn.k_proj,0.00815293,0.01000,1.256
3,self_attn.v_proj,0.00853108,0.01000,1.205
3,self_attn.q_proj,0.03172233,0.01000,1.235
3,self_attn.o_proj,0.04524668,0.01000,1.268
3,mlp.up_proj,6.54533100,0.01000,1.322
3,mlp.gate_proj,14.77986145,0.01000,1.279
3,mlp.down_proj,0.37597522,0.01000,5.353
4,self_attn.k_proj,0.01413451,0.01000,1.259
4,self_attn.v_proj,0.01470964,0.01000,1.208
4,self_attn.q_proj,0.05791626,0.01000,1.237
4,self_attn.o_proj,0.06184003,0.01000,1.259
4,mlp.up_proj,13.34243965,0.01000,1.319
4,mlp.gate_proj,22.78504181,0.01000,1.278
4,mlp.down_proj,0.41737747,0.01000,5.333
5,self_attn.k_proj,0.01564825,0.01000,1.198
5,self_attn.v_proj,0.01523696,0.01000,1.207
5,self_attn.q_proj,0.06512326,0.01000,1.232
5,self_attn.o_proj,0.07203308,0.01000,1.261
5,mlp.up_proj,9.74938202,0.01000,1.334
5,mlp.gate_proj,24.67286491,0.01000,1.288
5,mlp.down_proj,0.70431685,0.01000,5.366
6,self_attn.k_proj,0.02744503,0.01000,1.253
6,self_attn.v_proj,0.02941702,0.01000,1.200
6,self_attn.q_proj,0.11530104,0.01000,1.225
6,self_attn.o_proj,0.09900515,0.01000,1.250
6,mlp.up_proj,22.07820129,0.01000,1.324
6,mlp.gate_proj,42.23360825,0.01000,1.274
6,mlp.down_proj,36.56550598,0.01000,5.427
7,self_attn.k_proj,0.11009024,0.01000,1.256
7,self_attn.v_proj,0.12083898,0.01000,1.205
7,self_attn.q_proj,0.48473150,0.01000,1.228
7,self_attn.o_proj,0.21330884,0.01000,1.267
7,mlp.up_proj,19.00367928,0.01000,1.326
7,mlp.gate_proj,40.35453033,0.01000,1.284
7,mlp.down_proj,1.01973176,0.01000,5.351
8,self_attn.k_proj,0.12112961,0.01000,1.260
8,self_attn.v_proj,0.13909948,0.01000,1.211
8,self_attn.q_proj,0.51785636,0.01000,1.233
8,self_attn.o_proj,0.23820072,0.01000,1.246
8,mlp.up_proj,7.41920280,0.01000,1.321
8,mlp.gate_proj,12.94360542,0.01000,1.273
8,mlp.down_proj,1.39439631,0.01000,5.409
9,self_attn.k_proj,0.08409639,0.01000,1.260
9,self_attn.v_proj,0.07808492,0.01000,1.217
9,self_attn.q_proj,0.34646398,0.01000,1.237
9,self_attn.o_proj,0.21907786,0.01000,1.254
9,mlp.up_proj,7.39851189,0.01000,1.319
9,mlp.gate_proj,8.18926239,0.01000,1.260
9,mlp.down_proj,1.94643378,0.01000,5.393
10,self_attn.k_proj,0.13818432,0.01000,1.269
10,self_attn.v_proj,0.15041357,0.01000,1.217
10,self_attn.q_proj,0.59162092,0.01000,1.233
10,self_attn.o_proj,0.35141155,0.01000,1.270
10,mlp.up_proj,8.58759117,0.01000,1.316
10,mlp.gate_proj,9.27396202,0.01000,1.280
10,mlp.down_proj,1.90882754,0.01000,5.004
11,self_attn.k_proj,0.22031164,0.01000,1.165
11,self_attn.v_proj,0.23452374,0.01000,1.086
11,self_attn.q_proj,0.94158274,0.01000,1.112
11,self_attn.o_proj,0.64426076,0.01000,1.192
11,mlp.up_proj,10.57266903,0.01000,1.205
11,mlp.gate_proj,11.31605530,0.01000,1.159
11,mlp.down_proj,2.49773169,0.01000,5.220
12,self_attn.k_proj,0.18946378,0.01000,1.137
12,self_attn.v_proj,0.18944678,0.01000,1.085
12,self_attn.q_proj,0.79821730,0.01000,1.108
12,self_attn.o_proj,0.60696584,0.01000,1.144
12,mlp.up_proj,12.56937885,0.01000,1.203
12,mlp.gate_proj,13.53184891,0.01000,1.158
12,mlp.down_proj,3.26138687,0.01000,4.992
13,self_attn.k_proj,0.41855329,0.01000,1.131
13,self_attn.v_proj,0.45423627,0.01000,1.081
13,self_attn.q_proj,1.83529305,0.01000,1.108
13,self_attn.o_proj,1.04172182,0.01000,1.142
13,mlp.up_proj,14.25735474,0.01000,1.206
13,mlp.gate_proj,16.45092010,0.01000,1.161
13,mlp.down_proj,3.83712721,0.01000,5.036
14,self_attn.k_proj,0.30206871,0.01000,1.151
14,self_attn.v_proj,0.31481010,0.01000,1.082
14,self_attn.q_proj,1.28473377,0.01000,1.107
14,self_attn.o_proj,1.00593269,0.01000,1.140
14,mlp.up_proj,14.68998814,0.01000,1.203
14,mlp.gate_proj,16.29914665,0.01000,1.158
14,mlp.down_proj,4.08327484,0.01000,4.999
15,self_attn.k_proj,0.29286253,0.01000,1.133
15,self_attn.v_proj,0.29624963,0.01000,1.081
15,self_attn.q_proj,1.24898148,0.01000,1.107
15,self_attn.o_proj,0.94168097,0.01000,1.143
15,mlp.up_proj,15.44438839,0.01000,1.208
15,mlp.gate_proj,16.09203911,0.01000,1.160
15,mlp.down_proj,4.34994030,0.01000,5.222
16,self_attn.k_proj,0.37170666,0.01000,1.140
16,self_attn.v_proj,0.39827538,0.01000,1.091
16,self_attn.q_proj,1.55861425,0.01000,1.118
16,self_attn.o_proj,1.24285769,0.01000,1.150
16,mlp.up_proj,14.82378101,0.01000,1.211
16,mlp.gate_proj,14.50064278,0.01000,1.166
16,mlp.down_proj,4.47918606,0.01000,5.239
17,self_attn.k_proj,0.39052096,0.01000,1.138
17,self_attn.v_proj,0.40798220,0.01000,1.089
17,self_attn.q_proj,1.74031353,0.01000,1.115
17,self_attn.o_proj,1.37823784,0.01000,1.151
17,mlp.up_proj,16.17243195,0.01000,1.211
17,mlp.gate_proj,15.60438156,0.01000,1.168
17,mlp.down_proj,4.64399624,0.01000,5.047
18,self_attn.k_proj,0.56799269,0.01000,1.138
18,self_attn.v_proj,0.58997786,0.01000,1.090
18,self_attn.q_proj,2.52048039,0.01000,1.115
18,self_attn.o_proj,1.32625484,0.01000,1.150
18,mlp.up_proj,17.34894753,0.01000,1.213
18,mlp.gate_proj,16.16296387,0.01000,1.166
18,mlp.down_proj,5.24123001,0.01000,5.028
19,self_attn.k_proj,0.78765279,0.01000,1.139
19,self_attn.v_proj,0.82200253,0.01000,1.090
19,self_attn.q_proj,3.36882591,0.01000,1.115
19,self_attn.o_proj,1.56877732,0.01000,1.150
19,mlp.up_proj,19.31034660,0.01000,1.214
19,mlp.gate_proj,18.24939346,0.01000,1.171
19,mlp.down_proj,19.38244438,0.01000,5.262
20,self_attn.k_proj,1.45878661,0.01000,1.140
20,self_attn.v_proj,1.65540659,0.01000,1.089
20,self_attn.q_proj,6.76156139,0.01000,1.172
20,self_attn.o_proj,2.54323125,0.01000,1.148
20,mlp.up_proj,20.89072037,0.01000,1.210
20,mlp.gate_proj,19.40013504,0.01000,1.200
20,mlp.down_proj,7.72142410,0.01000,5.028
21,self_attn.k_proj,1.53237510,0.01000,1.164
21,self_attn.v_proj,1.50878608,0.01000,1.111
21,self_attn.q_proj,6.41003466,0.01000,1.137
21,self_attn.o_proj,3.52649236,0.01000,1.175
21,mlp.up_proj,22.51968193,0.01000,1.235
21,mlp.gate_proj,21.30210114,0.01000,1.188
21,mlp.down_proj,9.00376606,0.01000,5.328
22,self_attn.k_proj,1.50288391,0.01000,1.163
22,self_attn.v_proj,1.69944835,0.01000,1.112
22,self_attn.q_proj,6.75498009,0.01000,1.140
22,self_attn.o_proj,3.26820421,0.01000,1.171
22,mlp.up_proj,25.29592514,0.01000,1.233
22,mlp.gate_proj,23.66239738,0.01000,1.188
22,mlp.down_proj,10.19321442,0.01000,5.648
23,self_attn.k_proj,2.24442339,0.01000,1.268
23,self_attn.v_proj,2.68446589,0.01000,1.216
23,self_attn.q_proj,10.67938042,0.01000,1.242
23,self_attn.o_proj,3.14105654,0.01000,1.276
23,mlp.up_proj,26.03298187,0.01000,1.334
23,mlp.gate_proj,23.97613907,0.01000,1.284
23,mlp.down_proj,11.99122715,0.01000,5.401
24,self_attn.k_proj,2.86726427,0.01000,1.267
24,self_attn.v_proj,3.32556772,0.01000,1.217
24,self_attn.q_proj,14.12276649,0.01000,1.241
24,self_attn.o_proj,5.11100626,0.01000,1.274
24,mlp.up_proj,28.37653542,0.01000,1.260
24,mlp.gate_proj,26.66292572,0.01000,1.229
24,mlp.down_proj,13.03630733,0.01000,5.630
25,self_attn.k_proj,2.84071159,0.01000,1.262
25,self_attn.v_proj,3.18226862,0.01000,1.213
25,self_attn.q_proj,13.24620533,0.01000,1.240
25,self_attn.o_proj,4.53262854,0.01000,1.269
25,mlp.up_proj,31.11689377,0.01000,1.325
25,mlp.gate_proj,29.45091438,0.01000,1.286
25,mlp.down_proj,16.67062569,0.01000,5.422
26,self_attn.k_proj,3.04549980,0.01000,1.268
26,self_attn.v_proj,3.58924627,0.01000,1.216
26,self_attn.q_proj,14.70914555,0.01000,1.238
26,self_attn.o_proj,5.08626604,0.01000,1.265
26,mlp.up_proj,35.11465454,0.01000,1.316
26,mlp.gate_proj,34.20375061,0.01000,1.288
26,mlp.down_proj,25.85625839,0.01000,5.677
27,self_attn.k_proj,4.69784307,0.01000,1.265
27,self_attn.v_proj,5.43581915,0.01000,1.213
27,self_attn.q_proj,21.46455383,0.01000,1.243
27,self_attn.o_proj,8.64262867,0.01000,1.257
27,mlp.up_proj,43.07937622,0.01000,1.329
27,mlp.gate_proj,42.03904724,0.01000,1.287
27,mlp.down_proj,38.25311279,0.01000,5.469
28,self_attn.k_proj,7.11673689,0.01000,1.148
28,self_attn.v_proj,8.83921146,0.01000,1.116
28,self_attn.q_proj,34.02442169,0.01000,1.141
28,self_attn.o_proj,11.82533550,0.01000,1.174
28,mlp.up_proj,54.42869568,0.01000,1.232
28,mlp.gate_proj,52.42176819,0.01000,1.188
28,mlp.down_proj,49.26332855,0.01000,5.177
29,self_attn.k_proj,10.84047508,0.01000,1.163
29,self_attn.v_proj,12.13834381,0.01000,1.111
29,self_attn.q_proj,49.52957916,0.01000,1.138
29,self_attn.o_proj,10.24733162,0.01000,1.170
29,mlp.up_proj,60.64951324,0.01000,1.234
29,mlp.gate_proj,58.13564301,0.01000,1.186
29,mlp.down_proj,71.04278564,0.01000,5.106
30,self_attn.k_proj,16.40185928,0.01000,1.220
30,self_attn.v_proj,20.49968338,0.01000,1.166
30,self_attn.q_proj,73.70677185,0.01000,1.200
30,self_attn.o_proj,19.58269501,0.01000,1.223
30,mlp.up_proj,78.38506317,0.01000,1.234
30,mlp.gate_proj,75.07140350,0.01000,1.212
30,mlp.down_proj,87.20764160,0.01000,5.132
31,self_attn.k_proj,16.42351151,0.01000,1.163
31,self_attn.v_proj,17.66336060,0.01000,1.111
31,self_attn.q_proj,73.27272034,0.01000,1.137
31,self_attn.o_proj,16.64413071,0.01000,1.171
31,mlp.up_proj,85.86994171,0.01000,1.233
31,mlp.gate_proj,80.61709595,0.01000,1.188
31,mlp.down_proj,109.44659424,0.01000,5.097
32,self_attn.k_proj,30.33241653,0.01000,1.254
32,self_attn.v_proj,39.78414536,0.01000,1.202
32,self_attn.q_proj,133.13043213,0.01000,1.228
32,self_attn.o_proj,18.90437317,0.01000,1.255
32,mlp.up_proj,98.08085632,0.01000,1.335
32,mlp.gate_proj,90.71247101,0.01000,1.292
32,mlp.down_proj,127.88627625,0.01000,5.394
33,self_attn.k_proj,37.90292740,0.01000,1.187
33,self_attn.v_proj,55.42217255,0.01000,1.170
33,self_attn.q_proj,166.64010620,0.01000,1.141
33,self_attn.o_proj,22.74843788,0.01000,1.206
33,mlp.up_proj,105.96579742,0.01000,1.242
33,mlp.gate_proj,95.90925598,0.01000,1.193
33,mlp.down_proj,149.81369019,0.01000,5.191
34,self_attn.k_proj,68.69132233,0.01000,1.170
34,self_attn.v_proj,90.13403320,0.01000,1.119
34,self_attn.q_proj,302.74011230,0.01000,1.143
34,self_attn.o_proj,28.94225502,0.01000,1.177
34,mlp.up_proj,120.51785278,0.01000,1.239
34,mlp.gate_proj,107.01783752,0.01000,1.195
34,mlp.down_proj,177.52862549,0.01000,5.115
35,self_attn.k_proj,90.71392822,0.01000,1.167
35,self_attn.v_proj,136.07887268,0.01000,1.114
35,self_attn.q_proj,415.88043213,0.01000,1.140
35,self_attn.o_proj,31.15754509,0.01000,1.175
35,mlp.up_proj,130.15463257,0.01000,1.252
35,mlp.gate_proj,113.93470764,0.01000,1.190
35,mlp.down_proj,216.24749756,0.01000,5.104
36,self_attn.k_proj,84.99306488,0.01000,1.165
36,self_attn.v_proj,107.49351501,0.01000,1.111
36,self_attn.q_proj,390.38854980,0.01000,1.140
36,self_attn.o_proj,58.52774811,0.01000,1.173
36,mlp.up_proj,140.36920166,0.01000,1.232
36,mlp.gate_proj,119.18859863,0.01000,1.187
36,mlp.down_proj,287.48580933,0.01000,5.318
37,self_attn.k_proj,108.47268677,0.01000,1.135
37,self_attn.v_proj,184.89364624,0.01000,1.086
37,self_attn.q_proj,520.99499512,0.01000,1.109
37,self_attn.o_proj,69.65980530,0.01000,1.144
37,mlp.up_proj,146.33651733,0.01000,1.207
37,mlp.gate_proj,122.30540466,0.01000,1.159
37,mlp.down_proj,395.49780273,0.01000,5.252
38,self_attn.k_proj,118.53613281,0.01000,1.264
38,self_attn.v_proj,180.38798523,0.01000,1.214
38,self_attn.q_proj,537.27764893,0.01000,1.240
38,self_attn.o_proj,139.20002747,0.01000,1.269
38,mlp.up_proj,169.68232727,0.01000,1.326
38,mlp.gate_proj,149.87057495,0.01000,1.278
38,mlp.down_proj,664.65612793,0.01000,5.627
39,self_attn.k_proj,53.54238510,0.01000,1.252
39,self_attn.v_proj,72.11396790,0.01000,1.200
39,self_attn.q_proj,237.48791504,0.01000,1.229
39,self_attn.o_proj,106.63746643,0.01000,1.275
39,mlp.up_proj,189.89593506,0.01000,1.318
39,mlp.gate_proj,172.65310669,0.01000,1.279
39,mlp.down_proj,2550.65991211,0.01000,5.655