File size: 8,834 Bytes
72efa40
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.84503669,0.01000,0.847
0,self_attn.v_proj,0.09790013,0.01000,0.621
0,self_attn.q_proj,3.45275998,0.01000,0.623
0,self_attn.o_proj,0.02797472,0.01000,0.716
0,mlp.up_proj,6.59510899,0.01000,0.753
0,mlp.gate_proj,14.64342403,0.01000,0.634
0,mlp.down_proj,0.54082263,0.01000,4.907
1,self_attn.k_proj,0.66450667,0.01000,0.755
1,self_attn.v_proj,0.13586605,0.01000,0.624
1,self_attn.q_proj,2.53379679,0.01000,0.622
1,self_attn.o_proj,0.01710801,0.01000,0.720
1,mlp.up_proj,56.40869904,0.01000,0.752
1,mlp.gate_proj,94.36625671,0.01000,0.638
1,mlp.down_proj,0.48488298,0.01000,4.885
2,self_attn.k_proj,1.85023427,0.01000,0.758
2,self_attn.v_proj,0.29796562,0.01000,0.620
2,self_attn.q_proj,6.63527250,0.01000,0.624
2,self_attn.o_proj,0.05357596,0.01000,0.721
2,mlp.up_proj,72.35107422,0.01000,0.754
2,mlp.gate_proj,120.69715118,0.01000,0.637
2,mlp.down_proj,0.71529531,0.01000,4.897
3,self_attn.k_proj,1.83869004,0.01000,0.816
3,self_attn.v_proj,0.42401373,0.01000,0.667
3,self_attn.q_proj,6.90928888,0.01000,0.638
3,self_attn.o_proj,0.22543210,0.01000,0.795
3,mlp.up_proj,199.29341125,0.01000,0.756
3,mlp.gate_proj,270.88391113,0.01000,0.641
3,mlp.down_proj,1.02437985,0.01000,4.892
4,self_attn.k_proj,3.05090141,0.01000,0.757
4,self_attn.v_proj,0.90732384,0.01000,0.623
4,self_attn.q_proj,12.91889858,0.01000,0.622
4,self_attn.o_proj,0.16272199,0.01000,0.724
4,mlp.up_proj,177.98535156,0.01000,0.751
4,mlp.gate_proj,268.20730591,0.01000,0.635
4,mlp.down_proj,1.51549566,0.01000,4.892
5,self_attn.k_proj,3.06540680,0.01000,0.769
5,self_attn.v_proj,1.12325358,0.01000,0.625
5,self_attn.q_proj,14.62543392,0.01000,0.622
5,self_attn.o_proj,0.21586980,0.01000,0.719
5,mlp.up_proj,267.72155762,0.01000,0.769
5,mlp.gate_proj,343.41455078,0.01000,0.638
5,mlp.down_proj,1.18007314,0.01000,4.889
6,self_attn.k_proj,2.07387280,0.01000,0.755
6,self_attn.v_proj,0.94506907,0.01000,0.621
6,self_attn.q_proj,9.86525154,0.01000,0.625
6,self_attn.o_proj,0.26159465,0.01000,0.720
6,mlp.up_proj,66.96002197,0.01000,0.760
6,mlp.gate_proj,95.20739746,0.01000,0.634
6,mlp.down_proj,3.78148937,0.01000,4.891
7,self_attn.k_proj,2.32142448,0.01000,0.754
7,self_attn.v_proj,1.96631455,0.01000,0.621
7,self_attn.q_proj,12.40788651,0.01000,0.621
7,self_attn.o_proj,0.92824316,0.01000,0.718
7,mlp.up_proj,66.62113190,0.01000,0.756
7,mlp.gate_proj,74.05113220,0.01000,0.640
7,mlp.down_proj,6.63149881,0.01000,4.882
8,self_attn.k_proj,4.55058146,0.01000,0.755
8,self_attn.v_proj,1.65348577,0.01000,0.632
8,self_attn.q_proj,18.91058159,0.01000,0.649
8,self_attn.o_proj,1.66989470,0.01000,0.720
8,mlp.up_proj,79.65923309,0.01000,0.748
8,mlp.gate_proj,83.44503021,0.01000,0.634
8,mlp.down_proj,7.66813326,0.01000,4.916
9,self_attn.k_proj,3.84148502,0.01000,0.754
9,self_attn.v_proj,2.96535730,0.01000,0.622
9,self_attn.q_proj,20.20914268,0.01000,0.626
9,self_attn.o_proj,2.59902573,0.01000,0.719
9,mlp.up_proj,156.97390747,0.01000,0.753
9,mlp.gate_proj,251.82458496,0.01000,0.638
9,mlp.down_proj,8.60938835,0.01000,4.885
10,self_attn.k_proj,4.07611465,0.01000,0.755
10,self_attn.v_proj,2.05425596,0.01000,0.622
10,self_attn.q_proj,19.85713577,0.01000,0.623
10,self_attn.o_proj,1.43030739,0.01000,0.720
10,mlp.up_proj,100.09529114,0.01000,0.749
10,mlp.gate_proj,113.80771637,0.01000,0.640
10,mlp.down_proj,8.42348957,0.01000,4.895
11,self_attn.k_proj,5.21213436,0.01000,0.755
11,self_attn.v_proj,1.78169560,0.01000,0.624
11,self_attn.q_proj,21.62147522,0.01000,0.625
11,self_attn.o_proj,2.29331183,0.01000,0.719
11,mlp.up_proj,95.10997009,0.01000,0.754
11,mlp.gate_proj,100.02523804,0.01000,0.638
11,mlp.down_proj,8.73736763,0.01000,4.897
12,self_attn.k_proj,5.94782352,0.01000,0.752
12,self_attn.v_proj,2.57430744,0.01000,0.623
12,self_attn.q_proj,25.37301826,0.01000,0.624
12,self_attn.o_proj,2.74405336,0.01000,0.720
12,mlp.up_proj,99.41949463,0.01000,0.760
12,mlp.gate_proj,98.57714081,0.01000,0.635
12,mlp.down_proj,10.31996155,0.01000,4.876
13,self_attn.k_proj,5.70451880,0.01000,0.753
13,self_attn.v_proj,3.61313081,0.01000,0.620
13,self_attn.q_proj,28.92498398,0.01000,0.623
13,self_attn.o_proj,5.05193090,0.01000,0.717
13,mlp.up_proj,102.82405853,0.01000,0.753
13,mlp.gate_proj,109.35607910,0.01000,0.674
13,mlp.down_proj,10.62277031,0.01000,4.872
14,self_attn.k_proj,8.16368103,0.01000,0.750
14,self_attn.v_proj,3.29415512,0.01000,0.616
14,self_attn.q_proj,40.57175064,0.01000,0.618
14,self_attn.o_proj,3.70151019,0.01000,0.719
14,mlp.up_proj,116.39168549,0.01000,0.752
14,mlp.gate_proj,117.40150452,0.01000,0.637
14,mlp.down_proj,12.35162067,0.01000,4.897
15,self_attn.k_proj,7.40435266,0.01000,0.754
15,self_attn.v_proj,2.82182503,0.01000,0.629
15,self_attn.q_proj,32.03612518,0.01000,0.622
15,self_attn.o_proj,2.86537886,0.01000,0.720
15,mlp.up_proj,109.34799194,0.01000,0.816
15,mlp.gate_proj,106.16775513,0.01000,0.652
15,mlp.down_proj,11.65571213,0.01000,4.899
16,self_attn.k_proj,7.20972252,0.01000,0.750
16,self_attn.v_proj,3.81571937,0.01000,0.615
16,self_attn.q_proj,35.60685730,0.01000,0.617
16,self_attn.o_proj,4.76396894,0.01000,0.718
16,mlp.up_proj,119.07849121,0.01000,0.753
16,mlp.gate_proj,115.41696167,0.01000,0.654
16,mlp.down_proj,13.42798615,0.01000,4.888
17,self_attn.k_proj,7.86328506,0.01000,0.756
17,self_attn.v_proj,4.99391937,0.01000,0.622
17,self_attn.q_proj,41.75648499,0.01000,0.624
17,self_attn.o_proj,3.45894480,0.01000,0.719
17,mlp.up_proj,143.43394470,0.01000,0.754
17,mlp.gate_proj,136.14013672,0.01000,0.643
17,mlp.down_proj,17.81203842,0.01000,4.882
18,self_attn.k_proj,6.22359562,0.01000,0.753
18,self_attn.v_proj,6.02423716,0.01000,0.624
18,self_attn.q_proj,35.44544601,0.01000,0.624
18,self_attn.o_proj,4.30885458,0.01000,0.722
18,mlp.up_proj,153.58898926,0.01000,0.760
18,mlp.gate_proj,142.47561646,0.01000,0.637
18,mlp.down_proj,18.25153732,0.01000,4.894
19,self_attn.k_proj,5.90289783,0.01000,0.757
19,self_attn.v_proj,6.39343739,0.01000,0.623
19,self_attn.q_proj,38.50756073,0.01000,0.624
19,self_attn.o_proj,5.47891045,0.01000,0.719
19,mlp.up_proj,163.33058167,0.01000,0.758
19,mlp.gate_proj,157.55880737,0.01000,0.635
19,mlp.down_proj,19.15095139,0.01000,4.872
20,self_attn.k_proj,6.11784792,0.01000,0.756
20,self_attn.v_proj,7.04739285,0.01000,0.625
20,self_attn.q_proj,36.47023392,0.01000,0.623
20,self_attn.o_proj,2.35553312,0.01000,0.717
20,mlp.up_proj,198.99542236,0.01000,0.750
20,mlp.gate_proj,190.01835632,0.01000,0.637
20,mlp.down_proj,32.01580811,0.01000,4.894
21,self_attn.k_proj,6.29537106,0.01000,0.758
21,self_attn.v_proj,10.25707436,0.01000,0.621
21,self_attn.q_proj,41.46713257,0.01000,0.621
21,self_attn.o_proj,8.36542606,0.01000,0.720
21,mlp.up_proj,250.49508667,0.01000,0.751
21,mlp.gate_proj,251.44859314,0.01000,0.636
21,mlp.down_proj,43.56330109,0.01000,4.881
22,self_attn.k_proj,8.49018574,0.01000,0.758
22,self_attn.v_proj,17.15532875,0.01000,0.622
22,self_attn.q_proj,56.59531021,0.01000,0.622
22,self_attn.o_proj,3.68090487,0.01000,0.717
22,mlp.up_proj,337.93640137,0.01000,0.756
22,mlp.gate_proj,333.52142334,0.01000,0.632
22,mlp.down_proj,67.46343994,0.01000,4.917
23,self_attn.k_proj,12.21148396,0.01000,0.757
23,self_attn.v_proj,25.81269073,0.01000,0.621
23,self_attn.q_proj,71.46172333,0.01000,0.623
23,self_attn.o_proj,11.98000240,0.01000,0.720
23,mlp.up_proj,483.65325928,0.01000,0.752
23,mlp.gate_proj,493.06561279,0.01000,0.635
23,mlp.down_proj,85.32797241,0.01000,4.916
24,self_attn.k_proj,9.50092220,0.01000,0.755
24,self_attn.v_proj,26.38395882,0.01000,0.623
24,self_attn.q_proj,66.23488617,0.01000,0.624
24,self_attn.o_proj,8.46130848,0.01000,0.730
24,mlp.up_proj,575.74047852,0.01000,0.748
24,mlp.gate_proj,538.54052734,0.01000,0.636
24,mlp.down_proj,111.23144531,0.01000,4.899
25,self_attn.k_proj,11.69873905,0.01000,0.754
25,self_attn.v_proj,50.58491135,0.01000,0.623
25,self_attn.q_proj,81.08997345,0.01000,0.622
25,self_attn.o_proj,11.35678291,0.01000,0.721
25,mlp.up_proj,770.88513184,0.01000,0.761
25,mlp.gate_proj,682.92773438,0.01000,0.637
25,mlp.down_proj,195.86593628,0.01000,4.877
26,self_attn.k_proj,15.98041534,0.01000,0.748
26,self_attn.v_proj,117.35370636,0.01000,0.618
26,self_attn.q_proj,119.34364319,0.01000,0.628
26,self_attn.o_proj,26.08083153,0.01000,0.716
26,mlp.up_proj,769.50878906,0.01000,0.747
26,mlp.gate_proj,671.80041504,0.01000,0.633
26,mlp.down_proj,279.47283936,0.01000,4.886
27,self_attn.k_proj,19.93762970,0.01000,0.750
27,self_attn.v_proj,191.60113525,0.01000,0.616
27,self_attn.q_proj,190.72473145,0.01000,0.619
27,self_attn.o_proj,32.69224930,0.01000,0.715
27,mlp.up_proj,870.30517578,0.01000,0.751
27,mlp.gate_proj,839.04919434,0.01000,0.634
27,mlp.down_proj,378.88079834,0.01000,4.875