File size: 8,774 Bytes
5267471
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,damp,time
0,self_attn.k_proj,0.45799875,0.01000,1.229
0,self_attn.v_proj,0.07609060,0.01000,0.792
0,self_attn.q_proj,2.12163448,0.01000,0.794
0,self_attn.o_proj,0.15833434,0.01000,0.797
0,mlp.up_proj,3.44300270,0.01000,1.198
0,mlp.gate_proj,9.25297356,0.01000,0.798
0,mlp.down_proj,0.70674431,0.01000,6.319
1,self_attn.k_proj,0.32750565,0.01000,0.812
1,self_attn.v_proj,0.07779335,0.01000,0.792
1,self_attn.q_proj,1.19940567,0.01000,0.791
1,self_attn.o_proj,0.03534722,0.01000,0.790
1,mlp.up_proj,47.91104126,0.01000,1.130
1,mlp.gate_proj,72.21174622,0.01000,0.795
1,mlp.down_proj,0.47584903,0.01000,5.495
2,self_attn.k_proj,0.97978824,0.01000,0.793
2,self_attn.v_proj,0.17162688,0.01000,0.783
2,self_attn.q_proj,3.59054279,0.01000,0.813
2,self_attn.o_proj,0.07696313,0.01000,0.809
2,mlp.up_proj,51.86732101,0.01000,0.978
2,mlp.gate_proj,81.22796631,0.01000,0.788
2,mlp.down_proj,0.57132983,0.01000,5.332
3,self_attn.k_proj,1.00729656,0.01000,0.798
3,self_attn.v_proj,0.24603574,0.01000,0.787
3,self_attn.q_proj,3.74738932,0.01000,0.792
3,self_attn.o_proj,0.28664696,0.01000,0.793
3,mlp.up_proj,117.40467834,0.01000,1.395
3,mlp.gate_proj,149.96266174,0.01000,0.794
3,mlp.down_proj,0.50525832,0.01250,5.778
4,self_attn.k_proj,1.65046954,0.01000,0.809
4,self_attn.v_proj,0.50013733,0.01000,0.802
4,self_attn.q_proj,7.17262077,0.01000,0.792
4,self_attn.o_proj,0.18240610,0.01000,0.797
4,mlp.up_proj,95.23252869,0.01000,1.478
4,mlp.gate_proj,135.10296631,0.01000,0.792
4,mlp.down_proj,1.10169077,0.01000,5.773
5,self_attn.k_proj,1.48517931,0.01000,0.799
5,self_attn.v_proj,0.57455540,0.01000,0.785
5,self_attn.q_proj,7.11627245,0.01000,0.786
5,self_attn.o_proj,0.18029036,0.01000,0.791
5,mlp.up_proj,137.73837280,0.01000,1.454
5,mlp.gate_proj,163.93475342,0.01000,0.792
5,mlp.down_proj,0.72991610,0.01000,5.101
6,self_attn.k_proj,0.91666269,0.01000,0.797
6,self_attn.v_proj,0.45087141,0.01000,0.784
6,self_attn.q_proj,4.46909571,0.01000,0.785
6,self_attn.o_proj,0.25428528,0.01000,0.794
6,mlp.up_proj,27.69116974,0.01000,1.101
6,mlp.gate_proj,38.12742615,0.01000,0.787
6,mlp.down_proj,1.80558443,0.01000,5.593
7,self_attn.k_proj,0.87672055,0.01000,0.801
7,self_attn.v_proj,0.77675360,0.01000,0.784
7,self_attn.q_proj,4.90382957,0.01000,0.785
7,self_attn.o_proj,0.60036409,0.01000,0.792
7,mlp.up_proj,25.44780350,0.01000,0.956
7,mlp.gate_proj,27.46134949,0.01000,0.790
7,mlp.down_proj,3.39160872,0.01000,5.749
8,self_attn.k_proj,1.73226166,0.01000,0.796
8,self_attn.v_proj,0.68621767,0.01000,0.784
8,self_attn.q_proj,7.69679880,0.01000,0.785
8,self_attn.o_proj,0.73930031,0.01000,0.788
8,mlp.up_proj,30.87631607,0.01000,0.939
8,mlp.gate_proj,31.48957253,0.01000,0.789
8,mlp.down_proj,3.74254274,0.01000,5.757
9,self_attn.k_proj,1.36867046,0.01000,0.794
9,self_attn.v_proj,1.12786245,0.01000,0.784
9,self_attn.q_proj,7.48112011,0.01000,0.786
9,self_attn.o_proj,1.36345375,0.01000,0.792
9,mlp.up_proj,60.58055878,0.01000,0.998
9,mlp.gate_proj,94.33630371,0.01000,0.793
9,mlp.down_proj,3.87477875,0.01000,4.974
10,self_attn.k_proj,1.37036932,0.01000,0.792
10,self_attn.v_proj,0.75882816,0.01000,0.782
10,self_attn.q_proj,6.94236088,0.01000,0.793
10,self_attn.o_proj,0.75480914,0.01000,0.803
10,mlp.up_proj,35.29159164,0.01000,0.841
10,mlp.gate_proj,38.67882538,0.01000,0.803
10,mlp.down_proj,3.74935198,0.01000,4.797
11,self_attn.k_proj,1.67335296,0.01000,0.795
11,self_attn.v_proj,0.65093291,0.01000,0.786
11,self_attn.q_proj,7.30354977,0.01000,0.786
11,self_attn.o_proj,1.00513470,0.01000,0.791
11,mlp.up_proj,33.77320480,0.01000,0.914
11,mlp.gate_proj,34.57297897,0.01000,0.791
11,mlp.down_proj,3.76886940,0.01000,5.628
12,self_attn.k_proj,1.86318445,0.01000,0.795
12,self_attn.v_proj,0.91608346,0.01000,0.785
12,self_attn.q_proj,8.48820114,0.01000,0.789
12,self_attn.o_proj,1.22396874,0.01000,0.792
12,mlp.up_proj,34.66112900,0.01000,1.025
12,mlp.gate_proj,33.52517319,0.01000,0.796
12,mlp.down_proj,4.20871687,0.01000,5.509
13,self_attn.k_proj,1.71873260,0.01000,0.796
13,self_attn.v_proj,1.17398250,0.01000,0.784
13,self_attn.q_proj,9.26076698,0.01000,0.786
13,self_attn.o_proj,1.98672080,0.01000,0.793
13,mlp.up_proj,34.07032013,0.01000,0.979
13,mlp.gate_proj,35.38600159,0.01000,0.792
13,mlp.down_proj,4.01914883,0.01000,5.745
14,self_attn.k_proj,2.35059500,0.01000,0.794
14,self_attn.v_proj,1.07187366,0.01000,0.785
14,self_attn.q_proj,12.55565739,0.01000,0.786
14,self_attn.o_proj,1.66337204,0.01000,0.796
14,mlp.up_proj,37.50673294,0.01000,1.044
14,mlp.gate_proj,36.76043701,0.01000,0.789
14,mlp.down_proj,4.56406212,0.01000,5.484
15,self_attn.k_proj,2.22288537,0.01000,0.796
15,self_attn.v_proj,0.94591284,0.01000,0.783
15,self_attn.q_proj,10.25840569,0.01000,0.787
15,self_attn.o_proj,1.22425127,0.01000,0.793
15,mlp.up_proj,35.22077942,0.01000,0.948
15,mlp.gate_proj,33.73355103,0.01000,0.790
15,mlp.down_proj,4.56615782,0.01000,5.648
16,self_attn.k_proj,1.99345851,0.01000,0.795
16,self_attn.v_proj,1.18918204,0.01000,0.785
16,self_attn.q_proj,10.32095146,0.01000,0.787
16,self_attn.o_proj,1.96564627,0.01000,0.796
16,mlp.up_proj,36.18003464,0.01000,1.343
16,mlp.gate_proj,34.63485718,0.01000,0.791
16,mlp.down_proj,4.48285961,0.01000,4.960
17,self_attn.k_proj,2.12233758,0.01000,0.793
17,self_attn.v_proj,1.49488401,0.01000,0.782
17,self_attn.q_proj,12.03779602,0.01000,0.786
17,self_attn.o_proj,1.56383574,0.01000,0.789
17,mlp.up_proj,43.32733917,0.01000,0.995
17,mlp.gate_proj,40.48381042,0.01000,0.790
17,mlp.down_proj,6.09112692,0.01000,4.888
18,self_attn.k_proj,1.62858880,0.01000,0.796
18,self_attn.v_proj,1.68938899,0.01000,0.785
18,self_attn.q_proj,9.95006275,0.01000,0.787
18,self_attn.o_proj,2.32261109,0.01000,0.792
18,mlp.up_proj,46.56050110,0.01000,0.908
18,mlp.gate_proj,42.73928833,0.01000,0.808
18,mlp.down_proj,6.82586384,0.01000,4.930
19,self_attn.k_proj,1.68053222,0.01000,0.812
19,self_attn.v_proj,2.05788898,0.01000,0.788
19,self_attn.q_proj,12.11944962,0.01000,0.784
19,self_attn.o_proj,2.68917871,0.01000,0.789
19,mlp.up_proj,52.29275131,0.01000,1.517
19,mlp.gate_proj,49.98110962,0.01000,0.798
19,mlp.down_proj,7.88660431,0.01000,5.795
20,self_attn.k_proj,1.84464359,0.01000,0.797
20,self_attn.v_proj,2.35779238,0.01000,0.785
20,self_attn.q_proj,11.92081356,0.01000,0.788
20,self_attn.o_proj,1.61213660,0.01000,0.795
20,mlp.up_proj,67.74790955,0.01000,1.324
20,mlp.gate_proj,64.78291321,0.01000,0.806
20,mlp.down_proj,14.59480381,0.01000,5.772
21,self_attn.k_proj,2.01086497,0.01000,0.800
21,self_attn.v_proj,3.80550861,0.01000,0.789
21,self_attn.q_proj,14.31709003,0.01000,0.788
21,self_attn.o_proj,7.11469269,0.01000,0.792
21,mlp.up_proj,90.64640808,0.01000,1.742
21,mlp.gate_proj,91.33148193,0.01000,0.789
21,mlp.down_proj,23.68573761,0.01000,5.691
22,self_attn.k_proj,2.82378864,0.01000,0.798
22,self_attn.v_proj,6.54322100,0.01000,0.785
22,self_attn.q_proj,20.41894722,0.01000,0.787
22,self_attn.o_proj,3.96613264,0.01000,0.793
22,mlp.up_proj,128.74058533,0.01000,1.051
22,mlp.gate_proj,127.80844116,0.01000,0.793
22,mlp.down_proj,41.23144150,0.01000,6.211
23,self_attn.k_proj,3.94794369,0.01000,0.796
23,self_attn.v_proj,10.11415863,0.01000,0.784
23,self_attn.q_proj,26.11191559,0.01000,0.787
23,self_attn.o_proj,9.28477287,0.01000,0.792
23,mlp.up_proj,182.26258850,0.01000,1.312
23,mlp.gate_proj,186.16828918,0.01000,0.787
23,mlp.down_proj,53.97393036,0.01000,5.231
24,self_attn.k_proj,3.14931726,0.01000,0.795
24,self_attn.v_proj,9.28114700,0.01000,0.788
24,self_attn.q_proj,23.26879501,0.01000,0.788
24,self_attn.o_proj,6.09074879,0.01000,0.791
24,mlp.up_proj,203.76696777,0.01000,1.037
24,mlp.gate_proj,193.12313843,0.01000,0.793
24,mlp.down_proj,70.43853760,0.01000,5.950
25,self_attn.k_proj,3.83410430,0.01000,0.806
25,self_attn.v_proj,15.94288731,0.01000,0.786
25,self_attn.q_proj,27.39394951,0.01000,0.787
25,self_attn.o_proj,9.11356163,0.01000,0.790
25,mlp.up_proj,267.07983398,0.01000,0.970
25,mlp.gate_proj,239.64936829,0.01000,0.796
25,mlp.down_proj,104.45835876,0.01000,5.545
26,self_attn.k_proj,5.11287212,0.01000,0.794
26,self_attn.v_proj,36.42906952,0.01000,0.784
26,self_attn.q_proj,40.85954285,0.01000,0.785
26,self_attn.o_proj,14.15282249,0.01000,0.791
26,mlp.up_proj,270.81805420,0.01000,0.976
26,mlp.gate_proj,238.73959351,0.01000,0.789
26,mlp.down_proj,0.00537085,0.01250,6.699
27,self_attn.k_proj,6.07175827,0.01000,0.808
27,self_attn.v_proj,53.75015259,0.01000,0.787
27,self_attn.q_proj,63.93183899,0.01000,0.789
27,self_attn.o_proj,21.21239853,0.01000,0.790
27,mlp.up_proj,344.58737183,0.01000,0.844
27,mlp.gate_proj,329.91827393,0.01000,0.789
27,mlp.down_proj,327.33453369,0.01000,5.639