zx-modelcloud's picture
Add files using upload-large-folder tool
370a9d9 verified
layer,module,loss,damp,time
0,self_attn.k_proj,1.52977,0.01000,0.419
0,self_attn.v_proj,0.04002,0.01000,0.248
0,self_attn.q_proj,2.05718,0.01000,0.239
0,self_attn.o_proj,0.00179,0.01000,0.248
0,mlp.up_proj,9.05834,0.01000,0.258
0,mlp.gate_proj,8.63545,0.01000,0.244
0,mlp.down_proj,0.19796,0.01000,0.723
1,self_attn.k_proj,0.03884,0.01000,0.267
1,self_attn.v_proj,0.00530,0.01000,0.253
1,self_attn.q_proj,0.03862,0.01000,0.253
1,self_attn.o_proj,0.04960,0.01000,0.250
1,mlp.up_proj,12.92030,0.01000,0.251
1,mlp.gate_proj,14.63847,0.01000,0.241
1,mlp.down_proj,0.32817,0.01000,0.687
3,self_attn.k_proj,62.73893,0.01000,0.254
3,self_attn.v_proj,13.23958,0.01000,0.307
3,self_attn.q_proj,57.28278,0.01000,0.260
3,self_attn.o_proj,0.13773,0.01000,0.245
3,mlp.up_proj,21.15522,0.01000,0.251
3,mlp.gate_proj,24.74686,0.01000,0.243
3,mlp.down_proj,0.53724,0.01000,0.727
4,self_attn.k_proj,68.30590,0.01000,0.263
4,self_attn.v_proj,15.82255,0.01000,0.247
4,self_attn.q_proj,63.01257,0.01000,0.259
4,self_attn.o_proj,0.22000,0.01000,0.242
4,mlp.up_proj,28.74498,0.01000,0.253
4,mlp.gate_proj,33.93200,0.01000,0.245
4,mlp.down_proj,0.65790,0.01000,0.692
5,self_attn.k_proj,60.91286,0.01000,0.271
5,self_attn.v_proj,14.59481,0.01000,0.232
5,self_attn.q_proj,56.24625,0.01000,0.232
5,self_attn.o_proj,0.32792,0.01000,0.248
5,mlp.up_proj,38.43754,0.01000,0.266
5,mlp.gate_proj,44.36505,0.01000,0.245
5,mlp.down_proj,1.13535,0.01000,0.690
6,self_attn.k_proj,60.38514,0.01000,0.246
6,self_attn.v_proj,16.79150,0.01000,0.234
6,self_attn.q_proj,57.52007,0.01000,0.232
6,self_attn.o_proj,0.55901,0.01000,0.293
6,mlp.up_proj,46.22112,0.01000,0.321
6,mlp.gate_proj,52.69062,0.01000,0.237
6,mlp.down_proj,12.85980,0.01000,0.794
7,self_attn.k_proj,68.91588,0.01000,0.244
7,self_attn.v_proj,25.70186,0.01000,0.234
7,self_attn.q_proj,74.04494,0.01000,0.336
7,self_attn.o_proj,0.60068,0.01000,0.296
7,mlp.up_proj,51.54780,0.01000,0.239
7,mlp.gate_proj,56.22544,0.01000,0.232
7,mlp.down_proj,2.15107,0.01000,0.670
8,self_attn.k_proj,63.73604,0.01000,0.250
8,self_attn.v_proj,24.49372,0.01000,0.232
8,self_attn.q_proj,65.13046,0.01000,0.231
8,self_attn.o_proj,0.90025,0.01000,0.237
8,mlp.up_proj,54.74615,0.01000,0.302
8,mlp.gate_proj,58.73801,0.01000,0.246
8,mlp.down_proj,2.61607,0.01000,0.706
9,self_attn.k_proj,68.32961,0.01000,0.322
9,self_attn.v_proj,29.13957,0.01000,0.270
9,self_attn.q_proj,68.92210,0.01000,0.238
9,self_attn.o_proj,1.26286,0.01000,0.245
9,mlp.up_proj,56.97021,0.01000,0.245
9,mlp.gate_proj,57.39296,0.01000,0.230
9,mlp.down_proj,2.88838,0.01000,0.670
10,self_attn.k_proj,77.47882,0.01000,0.247
10,self_attn.v_proj,37.03654,0.01000,0.242
10,self_attn.q_proj,82.30052,0.01000,0.276
10,self_attn.o_proj,1.59611,0.01000,0.258
10,mlp.up_proj,60.05450,0.01000,0.261
10,mlp.gate_proj,63.74242,0.01000,0.233
10,mlp.down_proj,3.57756,0.01000,0.664
11,self_attn.k_proj,76.88316,0.01000,0.302
11,self_attn.v_proj,42.78612,0.01000,0.267
11,self_attn.q_proj,81.16360,0.01000,0.301
11,self_attn.o_proj,1.50892,0.01000,0.335
11,mlp.up_proj,63.83591,0.01000,0.341
11,mlp.gate_proj,65.37469,0.01000,0.296
11,mlp.down_proj,4.61587,0.01000,0.771
12,self_attn.k_proj,77.84145,0.01000,0.249
12,self_attn.v_proj,43.29803,0.01000,0.257
12,self_attn.q_proj,81.49866,0.01000,0.287
12,self_attn.o_proj,2.36211,0.01000,0.259
12,mlp.up_proj,67.92334,0.01000,0.292
12,mlp.gate_proj,68.87761,0.01000,0.303
12,mlp.down_proj,5.67846,0.01000,0.746
13,self_attn.k_proj,78.39484,0.01000,0.267
13,self_attn.v_proj,49.21562,0.01000,0.263
13,self_attn.q_proj,78.76001,0.01000,0.272
13,self_attn.o_proj,2.40954,0.01000,0.254
13,mlp.up_proj,72.61395,0.01000,0.246
13,mlp.gate_proj,72.00835,0.01000,0.236
13,mlp.down_proj,7.55164,0.01000,0.774
14,self_attn.k_proj,85.13994,0.01000,0.242
14,self_attn.v_proj,65.58170,0.01000,0.230
14,self_attn.q_proj,91.41071,0.01000,0.237
14,self_attn.o_proj,3.37462,0.01000,0.240
14,mlp.up_proj,83.58630,0.01000,0.242
14,mlp.gate_proj,80.19814,0.01000,0.232
14,mlp.down_proj,10.20866,0.01000,0.662
15,self_attn.k_proj,82.94417,0.01000,0.244
15,self_attn.v_proj,70.66344,0.01000,0.256
15,self_attn.q_proj,86.81380,0.01000,0.230
15,self_attn.o_proj,3.95524,0.01000,0.236
15,mlp.up_proj,99.12436,0.01000,0.240
15,mlp.gate_proj,92.91805,0.01000,0.286
15,mlp.down_proj,13.83353,0.01000,0.701
16,self_attn.k_proj,88.87656,0.01000,0.244
16,self_attn.v_proj,75.56125,0.01000,0.243
16,self_attn.q_proj,93.78792,0.01000,0.231
16,self_attn.o_proj,3.89123,0.01000,0.239
16,mlp.up_proj,116.95462,0.01000,0.241
16,mlp.gate_proj,109.16769,0.01000,0.233
16,mlp.down_proj,18.61803,0.01000,0.664
17,self_attn.k_proj,88.49626,0.01000,0.244
17,self_attn.v_proj,98.59828,0.01000,0.233
17,self_attn.q_proj,97.10524,0.01000,0.231
17,self_attn.o_proj,5.03318,0.01000,0.238
17,mlp.up_proj,134.24248,0.01000,0.278
17,mlp.gate_proj,125.89964,0.01000,0.247
17,mlp.down_proj,22.90651,0.01000,0.655
18,self_attn.k_proj,91.61066,0.01000,0.253
18,self_attn.v_proj,120.96928,0.01000,0.253
18,self_attn.q_proj,99.53651,0.01000,0.232
18,self_attn.o_proj,8.69388,0.01000,0.236
18,mlp.up_proj,156.05095,0.01000,0.240
18,mlp.gate_proj,139.47502,0.01000,0.232
18,mlp.down_proj,30.87194,0.01000,0.660
19,self_attn.k_proj,96.57993,0.01000,0.241
19,self_attn.v_proj,132.85014,0.01000,0.230
19,self_attn.q_proj,105.32343,0.01000,0.230
19,self_attn.o_proj,9.85187,0.01000,0.270
19,mlp.up_proj,173.96132,0.01000,0.243
19,mlp.gate_proj,152.68323,0.01000,0.232
19,mlp.down_proj,42.00521,0.01000,0.674
20,self_attn.k_proj,101.74275,0.01000,0.276
20,self_attn.v_proj,147.70975,0.01000,0.231
20,self_attn.q_proj,111.28523,0.01000,0.239
20,self_attn.o_proj,8.89061,0.01000,0.244
20,mlp.up_proj,188.34740,0.01000,0.242
20,mlp.gate_proj,161.44333,0.01000,0.234
20,mlp.down_proj,49.47644,0.01000,0.674
21,self_attn.k_proj,104.71509,0.01000,0.254
21,self_attn.v_proj,158.71223,0.01000,0.254
21,self_attn.q_proj,115.99524,0.01000,0.265
21,self_attn.o_proj,12.59802,0.01000,0.241
21,mlp.up_proj,213.42955,0.01000,0.251
21,mlp.gate_proj,180.52798,0.01000,0.282
21,mlp.down_proj,63.05851,0.01000,0.709
22,self_attn.k_proj,96.23979,0.01000,0.243
22,self_attn.v_proj,150.83650,0.01000,0.230
22,self_attn.q_proj,103.43996,0.01000,0.231
22,self_attn.o_proj,18.46274,0.01000,0.235
22,mlp.up_proj,230.47380,0.01000,0.239
22,mlp.gate_proj,198.01071,0.01000,0.232
22,mlp.down_proj,76.59824,0.01000,0.658
23,self_attn.k_proj,99.04884,0.01000,0.241
23,self_attn.v_proj,149.65315,0.01000,0.230
23,self_attn.q_proj,97.98630,0.01000,0.258
23,self_attn.o_proj,30.47421,0.01000,0.298
23,mlp.up_proj,256.14508,0.01000,0.253
23,mlp.gate_proj,221.90912,0.01000,0.232
23,mlp.down_proj,158.18503,0.01000,0.668
24,lm_head,132.93503,0.01000,3.311