Commit
·
fec22c9
1
Parent(s):
563d6f7
Upload part 23
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +50 -0
- checkpoint_1007000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_1.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp10296302854619443759.~1663960301028866~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp10672326537729832160.~1663960300016902~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp4323493746792918827.~1663960300272062~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp6187696939640315561.~1663960300133222~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp7819897597393638482.~1663960300070802~ +1 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp13235743666992055771.~1663960300610861~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp245554725322020391.~1663960300986637~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp7081703532691619183.~1663960300553725~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp9130579545580510080.~1663960300461979~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp9387726656363656464.~1663960300940800~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp10328583312988144199.~1663960300551647~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp13797936759071255094.~1663960300347902~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp13986472075519930249.~1663960300685650~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp1467584061988000765.~1663960300385708~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp16591741030595486867.~1663960300823709~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp18283481202771270668.~1663960300496415~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp4823703594089859210.~1663960300603078~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/.zarray.__tmp112152727729513876.~1663960300491658~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/.zarray.__tmp6303835615061701227.~1663960300599592~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/0.0 +3 -0
.gitattributes
CHANGED
@@ -1197,3 +1197,53 @@ checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.2 filter
|
|
1197 |
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1198 |
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1199 |
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1197 |
checkpoint_1007000/target.decoder.layers_14.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1198 |
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1199 |
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1200 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1201 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
1202 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
1203 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
1204 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
1205 |
+
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1206 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1207 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1208 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1209 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
1210 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
1211 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
1212 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
1213 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1214 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1215 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1216 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1217 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
1218 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
1219 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
1220 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
1221 |
+
checkpoint_1007000/target.encoder.layers_5.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1222 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1223 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1224 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1225 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
1226 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
1227 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
1228 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
1229 |
+
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1230 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
1231 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
1232 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
1233 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1234 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
1235 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
1236 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
1237 |
+
checkpoint_1007000/target.decoder.layers_9.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
1238 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1239 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1240 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1241 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
1242 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
1243 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
1244 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
1245 |
+
checkpoint_1007000/target.encoder.layers_10.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1246 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
1247 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
1248 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
1249 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_7.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (15.1 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_1.pre_cross_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.pre_cross_attention_layer_norm.scale/0
ADDED
Binary file (15.1 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp10296302854619443759.~1663960301028866~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp10672326537729832160.~1663960300016902~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp4323493746792918827.~1663960300272062~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp6187696939640315561.~1663960300133222~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/.zarray.__tmp7819897597393638482.~1663960300070802~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88c2248796d38d3ed5a13a52980350b72ab9388cf6a57eec6aff1fc4754bae45
|
3 |
+
size 7811928
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ad41cc3d897229d81ed6b5272a93cb174586e6f3dba87e98b85e4923e628f71
|
3 |
+
size 7804441
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3ae395fac0522f60df3bf4054a457a1863358bf46cc550b1c0b3c9c3b0d5f97
|
3 |
+
size 7803857
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72b5f8e3530862d81e0729a1b9fc015989511091b9a9faae9d93bd8a9c8bf0e6
|
3 |
+
size 7804800
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ee558c944fbdb74408382104e96dc00e53e19e5e1f7fa87a56033fa73c0e341
|
3 |
+
size 7803569
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09d6097a92bb8893f025754ae14be88206b9ad27a1b1a611ef9be9d9bfa24689
|
3 |
+
size 7805132
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a93f11a0651f8b87ddcde49f8c94bbf775ede4f3726fdfe6e0c13eac4dd5fff
|
3 |
+
size 7802981
|
checkpoint_1007000/target.decoder.layers_1.self_attention.query.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd495784098d43cba5426e4948fc9583e2f4d11d329dd8ad6d0b18bfaf93ad7e
|
3 |
+
size 7804331
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp13235743666992055771.~1663960300610861~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp245554725322020391.~1663960300986637~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp7081703532691619183.~1663960300553725~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp9130579545580510080.~1663960300461979~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/.zarray.__tmp9387726656363656464.~1663960300940800~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89935e0362f769922a22444be6e63fb0d3d4c69cfbfb3769174bf46de2dd4b94
|
3 |
+
size 7806982
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b7c6cf508f80ffa4d62590b847d030c863f663dadc3c93021418f524db5eb79
|
3 |
+
size 7819548
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4d45da65f361b03600e3ddd30f4fab4152c6c5e118821551ad1b1239f0b218e
|
3 |
+
size 7802081
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43665bb6a026d64fdb2c2ca188fd8e908fc519f1af7cff39c4bbee1b1c2b8204
|
3 |
+
size 7818668
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74db57e6bb0bb725ede94ae4022207052af377ac8e2480752aba9995824328c5
|
3 |
+
size 7816582
|
checkpoint_1007000/target.decoder.layers_13.self_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90bc5b873fd47263641d9acdecb42a337eb4977e027a025ba23a8b6c301b9e6e
|
3 |
+
size 7819212
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp10328583312988144199.~1663960300551647~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp13797936759071255094.~1663960300347902~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp13986472075519930249.~1663960300685650~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp1467584061988000765.~1663960300385708~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp16591741030595486867.~1663960300823709~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp18283481202771270668.~1663960300496415~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/.zarray.__tmp4823703594089859210.~1663960300603078~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2d12d09e343dd64a10da994c6692bb96b263c05f3bb33a96d1408053366f8c1
|
3 |
+
size 7815772
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0bed9ccb84c6e04c65f85e9486b834c63f2ded53f2e96fa4b55e062125c7bb3
|
3 |
+
size 7816233
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b55d8533d9ca46dc438e181d37b9306f37e48d81c6405c2df191d62b0f316d60
|
3 |
+
size 7817375
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20e28e814a62d784f02b38235dafbb693d49f34228910da30aec9e94bf437f74
|
3 |
+
size 7815349
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a809641d0191485eb31d94f9e38a10b717177b4fbcc12be78de0b0c8c0b84b90
|
3 |
+
size 7815180
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c34febfaba5e598af4bde375a3b3592727cf6a4f9b825565ff0ddc3d468ed182
|
3 |
+
size 7816265
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63fdeceae2db80130e78c396c9317b5751a21f20cbc6c5fcb0df63d8ee1ffe85
|
3 |
+
size 7814997
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.query.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2a4f27e4aaff1993995cab7bd93133b774d5b53865d3949703591ce4fff5b1d
|
3 |
+
size 7816010
|
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/.zarray.__tmp112152727729513876.~1663960300491658~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/.zarray.__tmp6303835615061701227.~1663960300599592~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.out.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b40ce9bc78e1bc4259faf4f6007b2b0342a15ce4be2635725e555f7b3effd03c
|
3 |
+
size 7801146
|