File size: 8,813 Bytes
fe96820
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,damp,time
0,self_attn.k_proj,0.11147800,0.01000,0.458
0,self_attn.v_proj,0.08630855,0.01000,0.219
0,self_attn.q_proj,0.25900897,0.01000,0.222
0,self_attn.o_proj,0.07599418,0.01000,0.450
0,mlp.up_proj,1.53504455,0.01000,0.232
0,mlp.gate_proj,3.04540825,0.01000,0.218
0,mlp.down_proj,0.08534984,0.01000,0.677
1,self_attn.k_proj,0.05401947,0.01000,0.235
1,self_attn.v_proj,0.05086039,0.01000,0.220
1,self_attn.q_proj,0.12237675,0.01000,0.220
1,self_attn.o_proj,0.01379651,0.01000,0.451
1,mlp.up_proj,5.61016464,0.01000,0.231
1,mlp.gate_proj,19.20188904,0.01000,0.219
1,mlp.down_proj,0.10827485,0.01000,0.678
2,self_attn.k_proj,0.10099948,0.01000,0.233
2,self_attn.v_proj,0.09610087,0.01000,0.219
2,self_attn.q_proj,0.23747258,0.01000,0.219
2,self_attn.o_proj,0.02400546,0.01000,0.450
2,mlp.up_proj,4.73568106,0.01000,0.232
2,mlp.gate_proj,13.18591118,0.01000,0.220
2,mlp.down_proj,4.35225487,0.01000,0.682
3,self_attn.k_proj,0.84643447,0.01000,0.236
3,self_attn.v_proj,0.85565448,0.01000,0.221
3,self_attn.q_proj,1.74525285,0.01000,0.222
3,self_attn.o_proj,0.05005993,0.01000,0.452
3,mlp.up_proj,6.21245098,0.01000,0.232
3,mlp.gate_proj,16.04592896,0.01000,0.222
3,mlp.down_proj,0.34597254,0.01000,0.682
4,self_attn.k_proj,0.78725469,0.01000,0.234
4,self_attn.v_proj,0.80693889,0.01000,0.220
4,self_attn.q_proj,1.57810068,0.01000,0.222
4,self_attn.o_proj,0.10350977,0.01000,0.453
4,mlp.up_proj,6.71505690,0.01000,0.234
4,mlp.gate_proj,15.28214741,0.01000,0.222
4,mlp.down_proj,0.41565913,0.01000,0.681
5,self_attn.k_proj,1.20404196,0.01000,0.234
5,self_attn.v_proj,1.30846250,0.01000,0.221
5,self_attn.q_proj,2.90022326,0.01000,0.221
5,self_attn.o_proj,0.11212036,0.01000,0.453
5,mlp.up_proj,6.31282043,0.01000,0.232
5,mlp.gate_proj,10.49855423,0.01000,0.219
5,mlp.down_proj,0.48409772,0.01000,0.681
6,self_attn.k_proj,0.93520665,0.01000,0.234
6,self_attn.v_proj,0.87466520,0.01000,0.221
6,self_attn.q_proj,2.08447576,0.01000,0.233
6,self_attn.o_proj,0.11541309,0.01000,0.453
6,mlp.up_proj,8.37039280,0.01000,0.232
6,mlp.gate_proj,13.32755280,0.01000,0.221
6,mlp.down_proj,0.70866877,0.01000,0.682
7,self_attn.k_proj,1.72509587,0.01000,0.232
7,self_attn.v_proj,1.93890357,0.01000,0.217
7,self_attn.q_proj,4.17893887,0.01000,0.215
7,self_attn.o_proj,0.14572459,0.01000,0.443
7,mlp.up_proj,9.48272038,0.01000,0.227
7,mlp.gate_proj,15.29617691,0.01000,0.215
7,mlp.down_proj,0.81154561,0.01000,0.710
8,self_attn.k_proj,2.27103615,0.01000,0.238
8,self_attn.v_proj,2.20937443,0.01000,0.224
8,self_attn.q_proj,5.15229893,0.01000,0.241
8,self_attn.o_proj,0.17240790,0.01000,0.446
8,mlp.up_proj,10.42674160,0.01000,0.243
8,mlp.gate_proj,16.20728493,0.01000,0.231
8,mlp.down_proj,1.09275961,0.01000,0.822
9,self_attn.k_proj,4.16666269,0.01000,1.138
9,self_attn.v_proj,4.43104601,0.01000,0.376
9,self_attn.q_proj,10.31816101,0.01000,0.415
9,self_attn.o_proj,0.31887323,0.01000,0.840
9,mlp.up_proj,12.31618500,0.01000,1.191
9,mlp.gate_proj,19.54656982,0.01000,1.154
9,mlp.down_proj,1.64975393,0.01000,2.770
10,self_attn.k_proj,3.93787289,0.01000,0.553
10,self_attn.v_proj,4.10471725,0.01000,1.859
10,self_attn.q_proj,9.49951458,0.01000,1.888
10,self_attn.o_proj,0.27260423,0.01000,0.464
10,mlp.up_proj,12.69118309,0.01000,0.238
10,mlp.gate_proj,20.18230057,0.01000,0.225
10,mlp.down_proj,2.11628580,0.01000,0.696
11,self_attn.k_proj,7.30851555,0.01000,0.237
11,self_attn.v_proj,6.77896643,0.01000,0.224
11,self_attn.q_proj,19.34665871,0.01000,0.225
11,self_attn.o_proj,0.66791785,0.01000,0.476
11,mlp.up_proj,13.51113892,0.01000,0.236
11,mlp.gate_proj,17.58659363,0.01000,0.224
11,mlp.down_proj,2.87829471,0.01000,0.691
12,self_attn.k_proj,7.20854664,0.01000,0.238
12,self_attn.v_proj,7.45390940,0.01000,0.224
12,self_attn.q_proj,19.43825531,0.01000,0.225
12,self_attn.o_proj,0.30023530,0.01000,0.460
12,mlp.up_proj,12.92345810,0.01000,0.238
12,mlp.gate_proj,15.76972866,0.01000,0.225
12,mlp.down_proj,2.75112391,0.01000,0.742
13,self_attn.k_proj,6.89573908,0.01000,0.238
13,self_attn.v_proj,8.19425392,0.01000,0.224
13,self_attn.q_proj,20.47906685,0.01000,0.224
13,self_attn.o_proj,0.44192302,0.01000,0.460
13,mlp.up_proj,13.60263252,0.01000,0.237
13,mlp.gate_proj,16.85786819,0.01000,0.224
13,mlp.down_proj,2.74464965,0.01000,0.694
14,self_attn.k_proj,9.22984314,0.01000,0.238
14,self_attn.v_proj,10.04637337,0.01000,0.222
14,self_attn.q_proj,25.66234970,0.01000,0.224
14,self_attn.o_proj,0.47217572,0.01000,0.462
14,mlp.up_proj,15.06594086,0.01000,0.235
14,mlp.gate_proj,18.42022133,0.01000,0.223
14,mlp.down_proj,3.77921104,0.01000,0.691
15,self_attn.k_proj,16.64938736,0.01000,0.238
15,self_attn.v_proj,20.63287735,0.01000,0.223
15,self_attn.q_proj,52.25179291,0.01000,0.224
15,self_attn.o_proj,0.78019929,0.01000,0.516
15,mlp.up_proj,16.64070892,0.01000,1.398
15,mlp.gate_proj,19.79901123,0.01000,1.352
15,mlp.down_proj,3.98885012,0.01000,1.246
16,self_attn.k_proj,23.15541840,0.01000,0.869
16,self_attn.v_proj,21.59778023,0.01000,0.406
16,self_attn.q_proj,65.96479797,0.01000,0.817
16,self_attn.o_proj,1.10674870,0.01000,1.846
16,mlp.up_proj,18.38120270,0.01000,0.439
16,mlp.gate_proj,20.62617493,0.01000,0.633
16,mlp.down_proj,7.29946709,0.01000,4.478
17,self_attn.k_proj,50.91555786,0.01000,0.994
17,self_attn.v_proj,62.10039520,0.01000,1.044
17,self_attn.q_proj,153.88165283,0.01000,1.083
17,self_attn.o_proj,2.35713625,0.01000,0.461
17,mlp.up_proj,28.26027870,0.01000,0.235
17,mlp.gate_proj,32.26748657,0.01000,0.223
17,mlp.down_proj,8.62757301,0.01000,0.693
18,self_attn.k_proj,47.62117004,0.01000,0.237
18,self_attn.v_proj,49.91074753,0.01000,0.224
18,self_attn.q_proj,148.18688965,0.01000,0.224
18,self_attn.o_proj,2.07341361,0.01000,0.459
18,mlp.up_proj,34.44437408,0.01000,0.237
18,mlp.gate_proj,39.49178314,0.01000,0.224
18,mlp.down_proj,13.71113110,0.01000,0.692
19,self_attn.k_proj,80.47894287,0.01000,0.239
19,self_attn.v_proj,90.67363739,0.01000,0.224
19,self_attn.q_proj,264.28625488,0.01000,0.232
19,self_attn.o_proj,4.05158710,0.01000,0.460
19,mlp.up_proj,43.40443420,0.01000,0.235
19,mlp.gate_proj,41.79368210,0.01000,0.224
19,mlp.down_proj,24.53729630,0.01000,0.693
20,self_attn.k_proj,111.07940674,0.01000,0.237
20,self_attn.v_proj,125.48833466,0.01000,0.223
20,self_attn.q_proj,326.05548096,0.01000,0.224
20,self_attn.o_proj,5.44219112,0.01000,0.461
20,mlp.up_proj,48.42160797,0.01000,0.236
20,mlp.gate_proj,43.89644623,0.01000,0.223
20,mlp.down_proj,28.64599991,0.01000,0.692
21,self_attn.k_proj,182.44018555,0.01000,0.238
21,self_attn.v_proj,234.88687134,0.01000,0.224
21,self_attn.q_proj,529.24645996,0.01000,0.234
21,self_attn.o_proj,9.00667953,0.01000,0.462
21,mlp.up_proj,57.38450623,0.01000,0.237
21,mlp.gate_proj,47.00152588,0.01000,0.224
21,mlp.down_proj,37.96351242,0.01000,0.700
22,self_attn.k_proj,201.98219299,0.01000,0.240
22,self_attn.v_proj,281.84835815,0.01000,0.238
22,self_attn.q_proj,535.36541748,0.01000,0.227
22,self_attn.o_proj,6.89678383,0.01000,0.476
22,mlp.up_proj,60.97026062,0.01000,0.238
22,mlp.gate_proj,48.76005554,0.01000,0.225
22,mlp.down_proj,38.75309753,0.01000,0.698
23,self_attn.k_proj,269.43804932,0.01000,0.239
23,self_attn.v_proj,304.47036743,0.01000,0.225
23,self_attn.q_proj,607.39343262,0.01000,0.226
23,self_attn.o_proj,13.71835327,0.01000,0.464
23,mlp.up_proj,68.53395844,0.01000,0.272
23,mlp.gate_proj,53.10926056,0.01000,0.257
23,mlp.down_proj,39.62349701,0.01000,0.691
24,self_attn.k_proj,446.88357544,0.01000,0.235
24,self_attn.v_proj,481.67712402,0.01000,0.221
24,self_attn.q_proj,1182.38500977,0.01000,0.223
24,self_attn.o_proj,11.81310463,0.01000,0.464
24,mlp.up_proj,64.03303528,0.01000,0.235
24,mlp.gate_proj,47.69067764,0.01000,0.222
24,mlp.down_proj,43.55418777,0.01000,0.694
25,self_attn.k_proj,518.00433350,0.01000,0.238
25,self_attn.v_proj,774.28698730,0.01000,0.223
25,self_attn.q_proj,1437.99023438,0.01000,0.224
25,self_attn.o_proj,16.01141739,0.01000,0.464
25,mlp.up_proj,60.59749222,0.01000,0.235
25,mlp.gate_proj,42.82708359,0.01000,0.221
25,mlp.down_proj,52.50085831,0.01000,0.694
26,self_attn.k_proj,481.84396362,0.01000,0.239
26,self_attn.v_proj,666.03979492,0.01000,0.224
26,self_attn.q_proj,1392.31616211,0.01000,0.225
26,self_attn.o_proj,32.51730347,0.01000,0.461
26,mlp.up_proj,63.72230148,0.01000,0.237
26,mlp.gate_proj,45.98903656,0.01000,0.224
26,mlp.down_proj,73.96157837,0.01000,0.696
27,self_attn.k_proj,372.15234375,0.01000,0.240
27,self_attn.v_proj,453.49694824,0.01000,0.224
27,self_attn.q_proj,820.22900391,0.01000,0.225
27,self_attn.o_proj,21.22069931,0.01000,0.464
27,mlp.up_proj,103.78501892,0.01000,0.236
27,mlp.gate_proj,95.20819092,0.01000,0.225
27,mlp.down_proj,89.54586029,0.01000,0.693