TimeRobber commited on
Commit
1e33f3e
·
1 Parent(s): e42c1df

Upload part 45

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +52 -0
  2. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray +1 -0
  3. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp10073661389214073732.~1663960300886449~ +1 -0
  4. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp14811671144810604280.~1663960300729667~ +1 -0
  5. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp1725700251694505214.~1663960300420073~ +1 -0
  6. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/0.0 +3 -0
  7. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/1.0 +3 -0
  8. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 +3 -0
  9. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/3.0 +3 -0
  10. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 +3 -0
  11. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 +3 -0
  12. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/6.0 +3 -0
  13. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 +3 -0
  14. checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/.zarray +1 -0
  15. checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/0 +0 -0
  16. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray +1 -0
  17. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp11807813215046036505.~1663960300385727~ +1 -0
  18. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp13611715367022834661.~1663960300774432~ +1 -0
  19. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp4630577611859278728.~1663960300730147~ +1 -0
  20. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp5344318709221343471.~1663960300421510~ +1 -0
  21. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp6005823555080937686.~1663960300546868~ +1 -0
  22. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp7800724356086543668.~1663960300686913~ +1 -0
  23. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp8469731595145937744.~1663960300471673~ +1 -0
  24. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.0 +3 -0
  25. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.1 +3 -0
  26. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.2 +3 -0
  27. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.3 +3 -0
  28. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.4 +3 -0
  29. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.5 +3 -0
  30. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.6 +3 -0
  31. checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.7 +3 -0
  32. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray +1 -0
  33. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp228878645978238791.~1663960300421217~ +1 -0
  34. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp2515899432506933413.~1663960300622371~ +1 -0
  35. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp4401067149692269771.~1663960300940912~ +1 -0
  36. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp5891776655746718169.~1663960300686376~ +1 -0
  37. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp82471505265950557.~1663960300548418~ +1 -0
  38. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp8439650670007955153.~1663960300549010~ +1 -0
  39. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp9155945814913170872.~1663960300466135~ +1 -0
  40. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.0 +3 -0
  41. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.1 +3 -0
  42. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.2 +3 -0
  43. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.3 +3 -0
  44. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.4 +3 -0
  45. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.5 +3 -0
  46. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.6 +3 -0
  47. checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.7 +3 -0
  48. checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/.zarray +1 -0
  49. checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/0 +0 -0
  50. checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/.zarray +1 -0
.gitattributes CHANGED
@@ -2287,3 +2287,55 @@ checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=
2287
  checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2288
  checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2289
  checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2287
  checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2288
  checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2289
  checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2290
+ checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2291
+ checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2292
+ checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2293
+ checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2294
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2295
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2296
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2297
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2298
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2299
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2300
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2301
+ checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2302
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2303
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2304
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2305
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2306
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2307
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2308
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2309
+ checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2310
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2311
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2312
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2313
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2314
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2315
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2316
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2317
+ checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2318
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2319
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2320
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2321
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2322
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2323
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2324
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2325
+ checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2326
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2327
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2328
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2329
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2330
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2331
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2332
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2333
+ checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2334
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2335
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2336
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2337
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2338
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2339
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2340
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2341
+ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp10073661389214073732.~1663960300886449~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp14811671144810604280.~1663960300729667~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp1725700251694505214.~1663960300420073~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b36c6f8f72ea934c89282b5516fd5e12cb7ea6ca491f3b35ac1df12d9d11978
3
+ size 19546888
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f14cafa4d3719bd27f2cba59a014bead7ab442623666d920d5174af6e9f75d3
3
+ size 19546010
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48999c6a40b05f3a77500b6d86c06b47ec8199733beac59b4f822a5480cbe165
3
+ size 19547174
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1857de19f2bdf58afb75b9c315678451c81551dcf66d2aa56e0d195940258d87
3
+ size 19547081
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdd4f8e0865ffd0c0bdb16b31c16502c1f26edb1b96d9087c32ce660726c02e4
3
+ size 19547230
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e492f130a8534733f81b87ce3b0989ecdd6e38591e6651d8fc39c0a26e1b50cd
3
+ size 19546681
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/6.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32d623d14bcdf4e2eedf5dfcb48dafb9ce9d7b0fc7a153ce31918d54f5a56f0e
3
+ size 19545821
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc1e556afae7fe3880c311cb98022d6116656482319b1335dda740300ddaf569
3
+ size 19547547
checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/0 ADDED
Binary file (14.6 kB). View file
 
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp11807813215046036505.~1663960300385727~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp13611715367022834661.~1663960300774432~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp4630577611859278728.~1663960300730147~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp5344318709221343471.~1663960300421510~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp6005823555080937686.~1663960300546868~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp7800724356086543668.~1663960300686913~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp8469731595145937744.~1663960300471673~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f1ac5351ab35a3462f72974a439a41776094b50df5a2838c33e947fd1468b37
3
+ size 7802802
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56881cb0f2687fadc435fa86fcedeb74920e5b7ec3f028c15dcaa94c0c4a09c1
3
+ size 7801935
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfa47de544dc1e0be2e0ad47262cac5e2c13abff7335b04d3a15d28ce80cf84e
3
+ size 7801740
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcb24fccabc51662ee118c80f340393a348b0bd59b97906e6e520ed9a08618e7
3
+ size 7803749
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe66779f2212c0efbbe84a04b9b277b1db4fdaf34b77a4e5a0e355c5caddb20a
3
+ size 7806466
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:367dd12f1f9baa30bc5c55d301ee2abc3a9e79ccf310af1323960c9c4639f30e
3
+ size 7804543
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ebfd38ca78610067edc7b5e078714265533cf37d7581aff38782f226c5b470e
3
+ size 7803577
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e974a60e17aab0e0c8d717106cfced86a6a7e36d4df93beb42e7a3cff4bb2448
3
+ size 7802433
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp228878645978238791.~1663960300421217~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp2515899432506933413.~1663960300622371~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp4401067149692269771.~1663960300940912~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp5891776655746718169.~1663960300686376~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp82471505265950557.~1663960300548418~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp8439650670007955153.~1663960300549010~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp9155945814913170872.~1663960300466135~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8f44f6d8fa9c446364360e804d62cfe7ed3cba582c39cf6bfd324883892adb7
3
+ size 19557369
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ca701d2ce76b828a3e14cd37ead2df98681cd7989591bb6b7f89005edfb436f
3
+ size 19556302
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:962ec9bb9370ed6ab7b563df5d6535ddf3886db4d8171eb566af3df98e75017f
3
+ size 19556681
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91d9740cb88d270f50961d8b43d4a3a61a2846469654eeb890b5b52bea020343
3
+ size 19562668
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efa0e651f9932f016d5406d168adf9f2a2ea07bbe9e1180b3cdaf7dc7641b0ad
3
+ size 19555460
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2853ae42115fbfe70f940ffe9633159261edc1077ee185e645a40988ae35c23c
3
+ size 19555683
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5d707e7e7d44b3f8667b5e525bc486b1c3ff7f8665e988a0c1e06ea756d8389
3
+ size 19556874
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0b7428b82b1d7dd01cc3d6597b2547a2c1e5516815fc26508c330ab5c25ae83
3
+ size 19557631
checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/0 ADDED
Binary file (14.9 kB). View file
 
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}