File size: 6,822 Bytes
d784d77
370a9d9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
layer,module,loss,damp,time
0,self_attn.k_proj,1.52977,0.01000,0.419
0,self_attn.v_proj,0.04002,0.01000,0.248
0,self_attn.q_proj,2.05718,0.01000,0.239
0,self_attn.o_proj,0.00179,0.01000,0.248
0,mlp.up_proj,9.05834,0.01000,0.258
0,mlp.gate_proj,8.63545,0.01000,0.244
0,mlp.down_proj,0.19796,0.01000,0.723
1,self_attn.k_proj,0.03884,0.01000,0.267
1,self_attn.v_proj,0.00530,0.01000,0.253
1,self_attn.q_proj,0.03862,0.01000,0.253
1,self_attn.o_proj,0.04960,0.01000,0.250
1,mlp.up_proj,12.92030,0.01000,0.251
1,mlp.gate_proj,14.63847,0.01000,0.241
1,mlp.down_proj,0.32817,0.01000,0.687
3,self_attn.k_proj,62.73893,0.01000,0.254
3,self_attn.v_proj,13.23958,0.01000,0.307
3,self_attn.q_proj,57.28278,0.01000,0.260
3,self_attn.o_proj,0.13773,0.01000,0.245
3,mlp.up_proj,21.15522,0.01000,0.251
3,mlp.gate_proj,24.74686,0.01000,0.243
3,mlp.down_proj,0.53724,0.01000,0.727
4,self_attn.k_proj,68.30590,0.01000,0.263
4,self_attn.v_proj,15.82255,0.01000,0.247
4,self_attn.q_proj,63.01257,0.01000,0.259
4,self_attn.o_proj,0.22000,0.01000,0.242
4,mlp.up_proj,28.74498,0.01000,0.253
4,mlp.gate_proj,33.93200,0.01000,0.245
4,mlp.down_proj,0.65790,0.01000,0.692
5,self_attn.k_proj,60.91286,0.01000,0.271
5,self_attn.v_proj,14.59481,0.01000,0.232
5,self_attn.q_proj,56.24625,0.01000,0.232
5,self_attn.o_proj,0.32792,0.01000,0.248
5,mlp.up_proj,38.43754,0.01000,0.266
5,mlp.gate_proj,44.36505,0.01000,0.245
5,mlp.down_proj,1.13535,0.01000,0.690
6,self_attn.k_proj,60.38514,0.01000,0.246
6,self_attn.v_proj,16.79150,0.01000,0.234
6,self_attn.q_proj,57.52007,0.01000,0.232
6,self_attn.o_proj,0.55901,0.01000,0.293
6,mlp.up_proj,46.22112,0.01000,0.321
6,mlp.gate_proj,52.69062,0.01000,0.237
6,mlp.down_proj,12.85980,0.01000,0.794
7,self_attn.k_proj,68.91588,0.01000,0.244
7,self_attn.v_proj,25.70186,0.01000,0.234
7,self_attn.q_proj,74.04494,0.01000,0.336
7,self_attn.o_proj,0.60068,0.01000,0.296
7,mlp.up_proj,51.54780,0.01000,0.239
7,mlp.gate_proj,56.22544,0.01000,0.232
7,mlp.down_proj,2.15107,0.01000,0.670
8,self_attn.k_proj,63.73604,0.01000,0.250
8,self_attn.v_proj,24.49372,0.01000,0.232
8,self_attn.q_proj,65.13046,0.01000,0.231
8,self_attn.o_proj,0.90025,0.01000,0.237
8,mlp.up_proj,54.74615,0.01000,0.302
8,mlp.gate_proj,58.73801,0.01000,0.246
8,mlp.down_proj,2.61607,0.01000,0.706
9,self_attn.k_proj,68.32961,0.01000,0.322
9,self_attn.v_proj,29.13957,0.01000,0.270
9,self_attn.q_proj,68.92210,0.01000,0.238
9,self_attn.o_proj,1.26286,0.01000,0.245
9,mlp.up_proj,56.97021,0.01000,0.245
9,mlp.gate_proj,57.39296,0.01000,0.230
9,mlp.down_proj,2.88838,0.01000,0.670
10,self_attn.k_proj,77.47882,0.01000,0.247
10,self_attn.v_proj,37.03654,0.01000,0.242
10,self_attn.q_proj,82.30052,0.01000,0.276
10,self_attn.o_proj,1.59611,0.01000,0.258
10,mlp.up_proj,60.05450,0.01000,0.261
10,mlp.gate_proj,63.74242,0.01000,0.233
10,mlp.down_proj,3.57756,0.01000,0.664
11,self_attn.k_proj,76.88316,0.01000,0.302
11,self_attn.v_proj,42.78612,0.01000,0.267
11,self_attn.q_proj,81.16360,0.01000,0.301
11,self_attn.o_proj,1.50892,0.01000,0.335
11,mlp.up_proj,63.83591,0.01000,0.341
11,mlp.gate_proj,65.37469,0.01000,0.296
11,mlp.down_proj,4.61587,0.01000,0.771
12,self_attn.k_proj,77.84145,0.01000,0.249
12,self_attn.v_proj,43.29803,0.01000,0.257
12,self_attn.q_proj,81.49866,0.01000,0.287
12,self_attn.o_proj,2.36211,0.01000,0.259
12,mlp.up_proj,67.92334,0.01000,0.292
12,mlp.gate_proj,68.87761,0.01000,0.303
12,mlp.down_proj,5.67846,0.01000,0.746
13,self_attn.k_proj,78.39484,0.01000,0.267
13,self_attn.v_proj,49.21562,0.01000,0.263
13,self_attn.q_proj,78.76001,0.01000,0.272
13,self_attn.o_proj,2.40954,0.01000,0.254
13,mlp.up_proj,72.61395,0.01000,0.246
13,mlp.gate_proj,72.00835,0.01000,0.236
13,mlp.down_proj,7.55164,0.01000,0.774
14,self_attn.k_proj,85.13994,0.01000,0.242
14,self_attn.v_proj,65.58170,0.01000,0.230
14,self_attn.q_proj,91.41071,0.01000,0.237
14,self_attn.o_proj,3.37462,0.01000,0.240
14,mlp.up_proj,83.58630,0.01000,0.242
14,mlp.gate_proj,80.19814,0.01000,0.232
14,mlp.down_proj,10.20866,0.01000,0.662
15,self_attn.k_proj,82.94417,0.01000,0.244
15,self_attn.v_proj,70.66344,0.01000,0.256
15,self_attn.q_proj,86.81380,0.01000,0.230
15,self_attn.o_proj,3.95524,0.01000,0.236
15,mlp.up_proj,99.12436,0.01000,0.240
15,mlp.gate_proj,92.91805,0.01000,0.286
15,mlp.down_proj,13.83353,0.01000,0.701
16,self_attn.k_proj,88.87656,0.01000,0.244
16,self_attn.v_proj,75.56125,0.01000,0.243
16,self_attn.q_proj,93.78792,0.01000,0.231
16,self_attn.o_proj,3.89123,0.01000,0.239
16,mlp.up_proj,116.95462,0.01000,0.241
16,mlp.gate_proj,109.16769,0.01000,0.233
16,mlp.down_proj,18.61803,0.01000,0.664
17,self_attn.k_proj,88.49626,0.01000,0.244
17,self_attn.v_proj,98.59828,0.01000,0.233
17,self_attn.q_proj,97.10524,0.01000,0.231
17,self_attn.o_proj,5.03318,0.01000,0.238
17,mlp.up_proj,134.24248,0.01000,0.278
17,mlp.gate_proj,125.89964,0.01000,0.247
17,mlp.down_proj,22.90651,0.01000,0.655
18,self_attn.k_proj,91.61066,0.01000,0.253
18,self_attn.v_proj,120.96928,0.01000,0.253
18,self_attn.q_proj,99.53651,0.01000,0.232
18,self_attn.o_proj,8.69388,0.01000,0.236
18,mlp.up_proj,156.05095,0.01000,0.240
18,mlp.gate_proj,139.47502,0.01000,0.232
18,mlp.down_proj,30.87194,0.01000,0.660
19,self_attn.k_proj,96.57993,0.01000,0.241
19,self_attn.v_proj,132.85014,0.01000,0.230
19,self_attn.q_proj,105.32343,0.01000,0.230
19,self_attn.o_proj,9.85187,0.01000,0.270
19,mlp.up_proj,173.96132,0.01000,0.243
19,mlp.gate_proj,152.68323,0.01000,0.232
19,mlp.down_proj,42.00521,0.01000,0.674
20,self_attn.k_proj,101.74275,0.01000,0.276
20,self_attn.v_proj,147.70975,0.01000,0.231
20,self_attn.q_proj,111.28523,0.01000,0.239
20,self_attn.o_proj,8.89061,0.01000,0.244
20,mlp.up_proj,188.34740,0.01000,0.242
20,mlp.gate_proj,161.44333,0.01000,0.234
20,mlp.down_proj,49.47644,0.01000,0.674
21,self_attn.k_proj,104.71509,0.01000,0.254
21,self_attn.v_proj,158.71223,0.01000,0.254
21,self_attn.q_proj,115.99524,0.01000,0.265
21,self_attn.o_proj,12.59802,0.01000,0.241
21,mlp.up_proj,213.42955,0.01000,0.251
21,mlp.gate_proj,180.52798,0.01000,0.282
21,mlp.down_proj,63.05851,0.01000,0.709
22,self_attn.k_proj,96.23979,0.01000,0.243
22,self_attn.v_proj,150.83650,0.01000,0.230
22,self_attn.q_proj,103.43996,0.01000,0.231
22,self_attn.o_proj,18.46274,0.01000,0.235
22,mlp.up_proj,230.47380,0.01000,0.239
22,mlp.gate_proj,198.01071,0.01000,0.232
22,mlp.down_proj,76.59824,0.01000,0.658
23,self_attn.k_proj,99.04884,0.01000,0.241
23,self_attn.v_proj,149.65315,0.01000,0.230
23,self_attn.q_proj,97.98630,0.01000,0.258
23,self_attn.o_proj,30.47421,0.01000,0.298
23,mlp.up_proj,256.14508,0.01000,0.253
23,mlp.gate_proj,221.90912,0.01000,0.232
23,mlp.down_proj,158.18503,0.01000,0.668
24,lm_head,132.93503,0.01000,3.311