Commit
·
1e33f3e
1
Parent(s):
e42c1df
Upload part 45
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +52 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp10073661389214073732.~1663960300886449~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp14811671144810604280.~1663960300729667~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp1725700251694505214.~1663960300420073~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp11807813215046036505.~1663960300385727~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp13611715367022834661.~1663960300774432~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp4630577611859278728.~1663960300730147~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp5344318709221343471.~1663960300421510~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp6005823555080937686.~1663960300546868~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp7800724356086543668.~1663960300686913~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp8469731595145937744.~1663960300471673~ +1 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp228878645978238791.~1663960300421217~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp2515899432506933413.~1663960300622371~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp4401067149692269771.~1663960300940912~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp5891776655746718169.~1663960300686376~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp82471505265950557.~1663960300548418~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp8439650670007955153.~1663960300549010~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp9155945814913170872.~1663960300466135~ +1 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/.zarray +1 -0
.gitattributes
CHANGED
@@ -2287,3 +2287,55 @@ checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=
|
|
2287 |
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2288 |
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2289 |
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2287 |
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2288 |
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2289 |
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2290 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2291 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2292 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2293 |
+
checkpoint_1007000/target.encoder.layers_12.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2294 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2295 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2296 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2297 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2298 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2299 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2300 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2301 |
+
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2302 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2303 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2304 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2305 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2306 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2307 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2308 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2309 |
+
checkpoint_1007000/target.encoder.layers_15.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2310 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2311 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2312 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2313 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2314 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2315 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2316 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2317 |
+
checkpoint_1007000/target.encoder.layers_16.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2318 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2319 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2320 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2321 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2322 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2323 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2324 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2325 |
+
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2326 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2327 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2328 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2329 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2330 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2331 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2332 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2333 |
+
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2334 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2335 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2336 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2337 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2338 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2339 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2340 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2341 |
+
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp10073661389214073732.~1663960300886449~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp14811671144810604280.~1663960300729667~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp1725700251694505214.~1663960300420073~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b36c6f8f72ea934c89282b5516fd5e12cb7ea6ca491f3b35ac1df12d9d11978
|
3 |
+
size 19546888
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f14cafa4d3719bd27f2cba59a014bead7ab442623666d920d5174af6e9f75d3
|
3 |
+
size 19546010
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48999c6a40b05f3a77500b6d86c06b47ec8199733beac59b4f822a5480cbe165
|
3 |
+
size 19547174
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1857de19f2bdf58afb75b9c315678451c81551dcf66d2aa56e0d195940258d87
|
3 |
+
size 19547081
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdd4f8e0865ffd0c0bdb16b31c16502c1f26edb1b96d9087c32ce660726c02e4
|
3 |
+
size 19547230
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e492f130a8534733f81b87ce3b0989ecdd6e38591e6651d8fc39c0a26e1b50cd
|
3 |
+
size 19546681
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32d623d14bcdf4e2eedf5dfcb48dafb9ce9d7b0fc7a153ce31918d54f5a56f0e
|
3 |
+
size 19545821
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc1e556afae7fe3880c311cb98022d6116656482319b1335dda740300ddaf569
|
3 |
+
size 19547547
|
checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_19.pre_cross_attention_layer_norm.scale/0
ADDED
Binary file (14.6 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp11807813215046036505.~1663960300385727~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp13611715367022834661.~1663960300774432~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp4630577611859278728.~1663960300730147~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp5344318709221343471.~1663960300421510~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp6005823555080937686.~1663960300546868~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp7800724356086543668.~1663960300686913~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/.zarray.__tmp8469731595145937744.~1663960300471673~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f1ac5351ab35a3462f72974a439a41776094b50df5a2838c33e947fd1468b37
|
3 |
+
size 7802802
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56881cb0f2687fadc435fa86fcedeb74920e5b7ec3f028c15dcaa94c0c4a09c1
|
3 |
+
size 7801935
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfa47de544dc1e0be2e0ad47262cac5e2c13abff7335b04d3a15d28ce80cf84e
|
3 |
+
size 7801740
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcb24fccabc51662ee118c80f340393a348b0bd59b97906e6e520ed9a08618e7
|
3 |
+
size 7803749
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe66779f2212c0efbbe84a04b9b277b1db4fdaf34b77a4e5a0e355c5caddb20a
|
3 |
+
size 7806466
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:367dd12f1f9baa30bc5c55d301ee2abc3a9e79ccf310af1323960c9c4639f30e
|
3 |
+
size 7804543
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ebfd38ca78610067edc7b5e078714265533cf37d7581aff38782f226c5b470e
|
3 |
+
size 7803577
|
checkpoint_1007000/target.decoder.layers_23.self_attention.query.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e974a60e17aab0e0c8d717106cfced86a6a7e36d4df93beb42e7a3cff4bb2448
|
3 |
+
size 7802433
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp228878645978238791.~1663960300421217~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp2515899432506933413.~1663960300622371~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp4401067149692269771.~1663960300940912~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp5891776655746718169.~1663960300686376~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp82471505265950557.~1663960300548418~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp8439650670007955153.~1663960300549010~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/.zarray.__tmp9155945814913170872.~1663960300466135~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8f44f6d8fa9c446364360e804d62cfe7ed3cba582c39cf6bfd324883892adb7
|
3 |
+
size 19557369
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ca701d2ce76b828a3e14cd37ead2df98681cd7989591bb6b7f89005edfb436f
|
3 |
+
size 19556302
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:962ec9bb9370ed6ab7b563df5d6535ddf3886db4d8171eb566af3df98e75017f
|
3 |
+
size 19556681
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91d9740cb88d270f50961d8b43d4a3a61a2846469654eeb890b5b52bea020343
|
3 |
+
size 19562668
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efa0e651f9932f016d5406d168adf9f2a2ea07bbe9e1180b3cdaf7dc7641b0ad
|
3 |
+
size 19555460
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2853ae42115fbfe70f940ffe9633159261edc1077ee185e645a40988ae35c23c
|
3 |
+
size 19555683
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5d707e7e7d44b3f8667b5e525bc486b1c3ff7f8665e988a0c1e06ea756d8389
|
3 |
+
size 19556874
|
checkpoint_1007000/target.decoder.layers_3.mlp.wi_0.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0b7428b82b1d7dd01cc3d6597b2547a2c1e5516815fc26508c330ab5c25ae83
|
3 |
+
size 19557631
|
checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.pre_self_attention_layer_norm.scale/0
ADDED
Binary file (14.9 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_3.self_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|