File size: 11,297 Bytes
156ad01
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
layer,module,loss,damp,time
0,self_attn.k_proj,0.00084345,0.01000,1.223
0,self_attn.v_proj,0.00068146,0.01000,0.958
0,self_attn.q_proj,0.00272547,0.01000,0.984
0,self_attn.o_proj,0.01153205,0.01000,1.062
0,mlp.up_proj,0.42405057,0.01000,1.042
0,mlp.gate_proj,0.48233882,0.01000,0.937
0,mlp.down_proj,0.13682523,0.01000,3.343
1,self_attn.k_proj,0.00306148,0.01000,1.021
1,self_attn.v_proj,0.00326485,0.01000,0.906
1,self_attn.q_proj,0.01053650,0.01000,0.917
1,self_attn.o_proj,0.01707373,0.01000,0.997
1,mlp.up_proj,3.89274645,0.01000,1.041
1,mlp.gate_proj,9.81082344,0.01000,0.948
1,mlp.down_proj,0.13348961,0.01000,3.339
2,self_attn.k_proj,0.00752404,0.01000,1.020
2,self_attn.v_proj,0.00730450,0.01000,0.906
2,self_attn.q_proj,0.02552866,0.01000,0.912
2,self_attn.o_proj,0.01780433,0.01000,0.998
2,mlp.up_proj,14.60232544,0.01000,1.103
2,mlp.gate_proj,18.93645859,0.01000,1.006
2,mlp.down_proj,0.10283960,0.01000,3.530
3,self_attn.k_proj,0.01320747,0.01000,1.058
3,self_attn.v_proj,0.01355978,0.01000,0.910
3,self_attn.q_proj,0.04728362,0.01000,0.944
3,self_attn.o_proj,0.03009962,0.01000,1.070
3,mlp.up_proj,8.75980186,0.01000,1.088
3,mlp.gate_proj,18.95158386,0.01000,1.012
3,mlp.down_proj,0.26747733,0.01000,3.475
4,self_attn.k_proj,0.02939725,0.01000,1.028
4,self_attn.v_proj,0.03019872,0.01000,0.951
4,self_attn.q_proj,0.10273295,0.01000,0.954
4,self_attn.o_proj,0.05014657,0.01000,1.030
4,mlp.up_proj,8.47503471,0.01000,1.061
4,mlp.gate_proj,22.23841858,0.01000,0.973
4,mlp.down_proj,0.52693486,0.01000,3.355
5,self_attn.k_proj,0.02845209,0.01000,1.084
5,self_attn.v_proj,0.03015556,0.01000,0.964
5,self_attn.q_proj,0.10408959,0.01000,0.988
5,self_attn.o_proj,0.07308136,0.01000,1.040
5,mlp.up_proj,5.37897968,0.01000,1.080
5,mlp.gate_proj,11.83506584,0.01000,0.947
5,mlp.down_proj,0.80324954,0.01000,3.326
6,self_attn.k_proj,0.05283313,0.01000,1.029
6,self_attn.v_proj,0.05892858,0.01000,0.907
6,self_attn.q_proj,0.21134073,0.01000,0.916
6,self_attn.o_proj,0.19954075,0.01000,0.997
6,mlp.up_proj,7.63845062,0.01000,1.039
6,mlp.gate_proj,15.10716438,0.01000,0.944
6,mlp.down_proj,311.62054443,0.01250,3.485
7,self_attn.k_proj,0.13129912,0.01000,1.030
7,self_attn.v_proj,0.12965125,0.01000,0.917
7,self_attn.q_proj,0.46275425,0.01000,0.971
7,self_attn.o_proj,0.17884624,0.01000,1.029
7,mlp.up_proj,8.66279984,0.01000,1.053
7,mlp.gate_proj,15.46934700,0.01000,0.953
7,mlp.down_proj,1.09758997,0.01000,3.460
8,self_attn.k_proj,0.20556173,0.01000,1.088
8,self_attn.v_proj,0.21755575,0.01000,0.931
8,self_attn.q_proj,0.73550230,0.01000,0.956
8,self_attn.o_proj,0.30261898,0.01000,1.054
8,mlp.up_proj,8.12370586,0.01000,1.043
8,mlp.gate_proj,9.27283096,0.01000,0.963
8,mlp.down_proj,1.92112541,0.01000,3.371
9,self_attn.k_proj,0.27409315,0.01000,1.059
9,self_attn.v_proj,0.25618106,0.01000,0.955
9,self_attn.q_proj,0.94490111,0.01000,0.949
9,self_attn.o_proj,0.39467937,0.01000,1.032
9,mlp.up_proj,10.28509808,0.01000,1.078
9,mlp.gate_proj,13.92613983,0.01000,1.010
9,mlp.down_proj,2.22738075,0.01000,3.323
10,self_attn.k_proj,0.49247986,0.01000,1.031
10,self_attn.v_proj,0.55498147,0.01000,0.915
10,self_attn.q_proj,1.77565324,0.01000,0.925
10,self_attn.o_proj,0.56055677,0.01000,1.051
10,mlp.up_proj,10.15948582,0.01000,1.066
10,mlp.gate_proj,13.05847359,0.01000,0.954
10,mlp.down_proj,2.34822321,0.01000,3.362
11,self_attn.k_proj,0.25672472,0.01000,1.041
11,self_attn.v_proj,0.25923651,0.01000,0.915
11,self_attn.q_proj,0.89068496,0.01000,0.937
11,self_attn.o_proj,0.48962367,0.01000,1.081
11,mlp.up_proj,10.13054466,0.01000,1.054
11,mlp.gate_proj,11.94238186,0.01000,0.955
11,mlp.down_proj,2.27761793,0.01000,3.355
12,self_attn.k_proj,0.29361516,0.01000,1.025
12,self_attn.v_proj,0.31215677,0.01000,0.904
12,self_attn.q_proj,1.03035307,0.01000,0.909
12,self_attn.o_proj,0.62685263,0.01000,0.989
12,mlp.up_proj,10.65883636,0.01000,1.032
12,mlp.gate_proj,11.68334961,0.01000,0.929
12,mlp.down_proj,2.40802383,0.01000,3.305
13,self_attn.k_proj,0.23688897,0.01000,1.016
13,self_attn.v_proj,0.22963072,0.01000,0.903
13,self_attn.q_proj,0.86696172,0.01000,0.968
13,self_attn.o_proj,0.44055608,0.01000,0.990
13,mlp.up_proj,10.96124840,0.01000,1.034
13,mlp.gate_proj,11.14621544,0.01000,0.936
13,mlp.down_proj,2.69857836,0.01000,3.454
14,self_attn.k_proj,0.39485866,0.01000,1.015
14,self_attn.v_proj,0.41287988,0.01000,0.935
14,self_attn.q_proj,1.45101392,0.01000,0.909
14,self_attn.o_proj,0.84102076,0.01000,0.997
14,mlp.up_proj,11.08079338,0.01000,1.030
14,mlp.gate_proj,11.16698456,0.01000,0.931
14,mlp.down_proj,2.64587307,0.01000,3.301
15,self_attn.k_proj,0.41717225,0.01000,1.020
15,self_attn.v_proj,0.40285957,0.01000,0.896
15,self_attn.q_proj,1.49380088,0.01000,0.907
15,self_attn.o_proj,0.63534236,0.01000,0.983
15,mlp.up_proj,10.80261135,0.01000,1.032
15,mlp.gate_proj,10.46665287,0.01000,0.935
15,mlp.down_proj,2.73456883,0.01000,3.292
16,self_attn.k_proj,0.72424465,0.01000,1.014
16,self_attn.v_proj,0.82824504,0.01000,0.901
16,self_attn.q_proj,2.79787111,0.01000,0.911
16,self_attn.o_proj,0.90882635,0.01000,0.988
16,mlp.up_proj,12.35648727,0.01000,1.032
16,mlp.gate_proj,12.38793182,0.01000,0.940
16,mlp.down_proj,6.66818047,0.01000,3.435
17,self_attn.k_proj,0.70203781,0.01000,1.014
17,self_attn.v_proj,0.78936088,0.01000,0.966
17,self_attn.q_proj,2.84893632,0.01000,0.963
17,self_attn.o_proj,1.12227607,0.01000,0.990
17,mlp.up_proj,12.15243912,0.01000,1.031
17,mlp.gate_proj,11.83664322,0.01000,0.931
17,mlp.down_proj,4.39354229,0.01000,3.308
18,self_attn.k_proj,0.81414771,0.01000,1.014
18,self_attn.v_proj,0.88813567,0.01000,0.906
18,self_attn.q_proj,3.11169171,0.01000,0.905
18,self_attn.o_proj,1.17401302,0.01000,0.991
18,mlp.up_proj,13.63390160,0.01000,1.054
18,mlp.gate_proj,13.29291534,0.01000,0.934
18,mlp.down_proj,4.49146700,0.01000,3.284
19,self_attn.k_proj,1.63328815,0.01000,1.009
19,self_attn.v_proj,1.73570788,0.01000,0.896
19,self_attn.q_proj,6.42503834,0.01000,0.901
19,self_attn.o_proj,2.07196093,0.01000,0.985
19,mlp.up_proj,15.83341026,0.01000,1.027
19,mlp.gate_proj,15.20757008,0.01000,0.926
19,mlp.down_proj,5.84636164,0.01000,3.285
20,self_attn.k_proj,1.39802408,0.01000,1.014
20,self_attn.v_proj,1.61639774,0.01000,0.911
20,self_attn.q_proj,6.03697252,0.01000,0.911
20,self_attn.o_proj,1.88721895,0.01000,1.008
20,mlp.up_proj,17.48505592,0.01000,1.048
20,mlp.gate_proj,16.52001953,0.01000,0.952
20,mlp.down_proj,6.67660427,0.01000,3.350
21,self_attn.k_proj,1.91823614,0.01000,1.029
21,self_attn.v_proj,2.32567382,0.01000,0.907
21,self_attn.q_proj,7.96147728,0.01000,0.913
21,self_attn.o_proj,2.20767069,0.01000,0.985
21,mlp.up_proj,20.54163170,0.01000,1.029
21,mlp.gate_proj,19.23807144,0.01000,0.973
21,mlp.down_proj,8.76621437,0.01000,3.410
22,self_attn.k_proj,4.29426956,0.01000,1.011
22,self_attn.v_proj,4.63158703,0.01000,0.946
22,self_attn.q_proj,16.66217995,0.01000,0.958
22,self_attn.o_proj,4.14088964,0.01000,0.984
22,mlp.up_proj,23.75897598,0.01000,1.034
22,mlp.gate_proj,22.41718292,0.01000,0.916
22,mlp.down_proj,14.20706463,0.01000,3.275
23,self_attn.k_proj,4.23601627,0.01000,1.024
23,self_attn.v_proj,5.31139517,0.01000,0.894
23,self_attn.q_proj,17.59301758,0.01000,0.907
23,self_attn.o_proj,6.05393505,0.01000,0.986
23,mlp.up_proj,27.09676933,0.01000,1.027
23,mlp.gate_proj,26.27134895,0.01000,0.929
23,mlp.down_proj,19.55945587,0.01000,3.314
24,self_attn.k_proj,7.49891663,0.01000,1.009
24,self_attn.v_proj,9.87843990,0.01000,0.900
24,self_attn.q_proj,30.90993500,0.01000,0.905
24,self_attn.o_proj,7.09949207,0.01000,0.993
24,mlp.up_proj,29.73819351,0.01000,1.040
24,mlp.gate_proj,29.18134117,0.01000,0.942
24,mlp.down_proj,22.95422173,0.01000,3.219
25,self_attn.k_proj,5.93120480,0.01000,0.990
25,self_attn.v_proj,7.25453568,0.01000,0.884
25,self_attn.q_proj,23.64049149,0.01000,0.891
25,self_attn.o_proj,4.29439020,0.01000,0.991
25,mlp.up_proj,33.44628143,0.01000,1.027
25,mlp.gate_proj,33.19001007,0.01000,0.934
25,mlp.down_proj,28.41608047,0.01000,3.299
26,self_attn.k_proj,9.55083275,0.01000,1.000
26,self_attn.v_proj,11.93259716,0.01000,0.894
26,self_attn.q_proj,39.13488007,0.01000,0.929
26,self_attn.o_proj,5.03051233,0.01000,1.002
26,mlp.up_proj,39.99806213,0.01000,1.058
26,mlp.gate_proj,39.10617828,0.01000,0.963
26,mlp.down_proj,32.86630249,0.01000,3.272
27,self_attn.k_proj,10.59832382,0.01000,0.986
27,self_attn.v_proj,14.43760967,0.01000,0.870
27,self_attn.q_proj,44.33682251,0.01000,0.880
27,self_attn.o_proj,5.79099655,0.01000,1.017
27,mlp.up_proj,45.47875977,0.01000,1.005
27,mlp.gate_proj,43.69628525,0.01000,0.905
27,mlp.down_proj,44.36285400,0.01000,3.205
28,self_attn.k_proj,12.43419266,0.01000,1.013
28,self_attn.v_proj,14.42409134,0.01000,0.894
28,self_attn.q_proj,48.00852966,0.01000,0.909
28,self_attn.o_proj,8.68338013,0.01000,0.988
28,mlp.up_proj,53.02674866,0.01000,1.028
28,mlp.gate_proj,49.65861511,0.01000,0.953
28,mlp.down_proj,61.60363007,0.01000,3.297
29,self_attn.k_proj,27.99073219,0.01000,1.007
29,self_attn.v_proj,41.02116013,0.01000,0.898
29,self_attn.q_proj,110.08837128,0.01000,0.934
29,self_attn.o_proj,10.62466049,0.01000,0.979
29,mlp.up_proj,62.11631393,0.01000,1.074
29,mlp.gate_proj,56.42256927,0.01000,0.930
29,mlp.down_proj,68.38681793,0.01000,3.414
30,self_attn.k_proj,32.98537445,0.01000,1.009
30,self_attn.v_proj,43.16372681,0.01000,0.891
30,self_attn.q_proj,124.46414185,0.01000,0.938
30,self_attn.o_proj,13.77541351,0.01000,0.981
30,mlp.up_proj,67.29389954,0.01000,1.027
30,mlp.gate_proj,59.62668991,0.01000,0.923
30,mlp.down_proj,89.72830963,0.01000,3.275
31,self_attn.k_proj,46.93622589,0.01000,1.027
31,self_attn.v_proj,64.97520447,0.01000,0.920
31,self_attn.q_proj,163.56146240,0.01000,0.937
31,self_attn.o_proj,17.66180038,0.01000,1.062
31,mlp.up_proj,71.82790375,0.01000,1.088
31,mlp.gate_proj,61.58316803,0.01000,0.994
31,mlp.down_proj,114.22307587,0.01000,3.326
32,self_attn.k_proj,62.93231964,0.01000,1.021
32,self_attn.v_proj,95.09659576,0.01000,0.942
32,self_attn.q_proj,239.13937378,0.01000,0.971
32,self_attn.o_proj,23.94524765,0.01000,1.019
32,mlp.up_proj,76.42587280,0.01000,1.059
32,mlp.gate_proj,64.23219299,0.01000,0.974
32,mlp.down_proj,146.99580383,0.01000,3.355
33,self_attn.k_proj,110.83970642,0.01000,1.083
33,self_attn.v_proj,209.03472900,0.01000,0.965
33,self_attn.q_proj,481.74597168,0.01000,0.972
33,self_attn.o_proj,42.13233948,0.01000,1.017
33,mlp.up_proj,81.78762817,0.01000,1.044
33,mlp.gate_proj,67.68517303,0.01000,0.946
33,mlp.down_proj,187.10368347,0.01000,3.384
34,self_attn.k_proj,90.71221924,0.01000,1.025
34,self_attn.v_proj,140.87960815,0.01000,0.908
34,self_attn.q_proj,391.42230225,0.01000,0.916
34,self_attn.o_proj,66.00537109,0.01000,1.001
34,mlp.up_proj,86.06692505,0.01000,1.041
34,mlp.gate_proj,75.02056885,0.01000,0.942
34,mlp.down_proj,238.53738403,0.01000,3.375
35,self_attn.k_proj,43.20785522,0.01000,1.027
35,self_attn.v_proj,56.80477142,0.01000,0.914
35,self_attn.q_proj,161.02618408,0.01000,0.927
35,self_attn.o_proj,46.36551285,0.01000,1.002
35,mlp.up_proj,110.93260193,0.01000,1.087
35,mlp.gate_proj,101.52717590,0.01000,0.995
35,mlp.down_proj,446.22875977,0.01000,3.489