Commit
·
0089441
1
Parent(s):
c285da1
Upload part 66
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +50 -0
- checkpoint_1007000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp14050066306458703621.~1663960300089898~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp14477734361951418052.~1663960301026654~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp16768930232080000876.~1663960300726012~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp18233595327996917928.~1663960300134020~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp2001586061358052897.~1663960299881881~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp6192635344089027354.~1663960300074781~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp8167355916865709290.~1663960300073273~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp12161734215931250339.~1663960300307849~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp12524848541358511717.~1663960300601878~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp12628051982135070532.~1663960300308343~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp16657994182915919170.~1663960300724969~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp2393733624015793071.~1663960300888757~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp9691434283791166311.~1663960300502229~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp12038369456628083008.~1663960300500390~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp12834423916420665428.~1663960300495461~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp12994895879745033.~1663960300551356~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp2221344313489107808.~1663960300387123~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp4445478388728139901.~1663960300774328~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp9955060625844959214.~1663960300497171~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_1.pre_attention_layer_norm.scale/.zarray +1 -0
.gitattributes
CHANGED
@@ -3281,3 +3281,53 @@ checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.0 filter=lf
|
|
3281 |
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3282 |
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3283 |
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3281 |
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3282 |
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3283 |
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3284 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3285 |
+
checkpoint_1007000/target.encoder.layers_17.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3286 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3287 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3288 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3289 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3290 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3291 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3292 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3293 |
+
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3294 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
3295 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
3296 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
3297 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3298 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
3299 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
3300 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
3301 |
+
checkpoint_1007000/target.encoder.layers_14.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
3302 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3303 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3304 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3305 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3306 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3307 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3308 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3309 |
+
checkpoint_1007000/target.encoder.layers_16.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3310 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
3311 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
3312 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
3313 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3314 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
3315 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
3316 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
3317 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
3318 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3319 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3320 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3321 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3322 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3323 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3324 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3325 |
+
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3326 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3327 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3328 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3329 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3330 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3331 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3332 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3333 |
+
checkpoint_1007000/target.encoder.layers_21.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0
ADDED
Binary file (14.9 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp14050066306458703621.~1663960300089898~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp14477734361951418052.~1663960301026654~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp16768930232080000876.~1663960300726012~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp18233595327996917928.~1663960300134020~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp2001586061358052897.~1663960299881881~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp6192635344089027354.~1663960300074781~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/.zarray.__tmp8167355916865709290.~1663960300073273~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47d02dfd28b6f8f86df595bfc4e878488927e4fea7c650aa1a175e5ffd19c0a1
|
3 |
+
size 7805147
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea21cc05d2895d7da9c6a52185723074e56fd529d29d8f8b83bf9ef2f2ecd87c
|
3 |
+
size 7809425
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a16a4d456acb52d2b5ad69487051fb1757fa95ead706debdde17a1fe7d1faf1d
|
3 |
+
size 7810129
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9299f63612e2d082cf4307208de62b5913ed1a70fdd80e47192a7f9cc6de61e5
|
3 |
+
size 7808135
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9e0dbf00de7d2195aee142e7901c2441595e83017add38060aa4310a2b0d58b
|
3 |
+
size 7802233
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfed3836ca7ca95342b2aae10ea85a2498d1d35085b3d26c2ade030a5978527c
|
3 |
+
size 7804792
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82603ecf6a65de9e44e4574c3bd2ac8fbfab43e05c7faeec9b051cdc9ee0f407
|
3 |
+
size 7803068
|
checkpoint_1007000/target.decoder.layers_0.encoder_decoder_attention.key.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4e56b8d54cf790e9d3e36c837e4df8f22d48ae70f08ff6f1800e44886512c11
|
3 |
+
size 7806197
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp12161734215931250339.~1663960300307849~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp12524848541358511717.~1663960300601878~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp12628051982135070532.~1663960300308343~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp16657994182915919170.~1663960300724969~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp2393733624015793071.~1663960300888757~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/.zarray.__tmp9691434283791166311.~1663960300502229~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7473dd516d180f27c357b4f62d251fb7d3a422c463e909bb7c839713947da58
|
3 |
+
size 7813067
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7440278eed3165aed7d216ccda35cea4614c9303ca1cbead7f7c594f425b61a5
|
3 |
+
size 7819311
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccfde8b42d6f7bf3d65d895ef8b1d9f9ad1fcea2fd37f273619e76a5bf5d7b78
|
3 |
+
size 7819638
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef91a89d0dfb149b0305a38088a6e585de6addfcbf699a32e5d426a1b6d6aa60
|
3 |
+
size 7818309
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54a54c48dc49ae8490233687f90ba9689331ae11e84be605e8c5063f307442b7
|
3 |
+
size 7816244
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d20a7d816e3fe98639ddc7354af000961f6a1fbea1566dc953d5165709ef6dc
|
3 |
+
size 7819295
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5708a79b1bef06d1e8f8cd9c2d20626d55a5bf43b6752a22630845c4e1d5e6bf
|
3 |
+
size 7816941
|
checkpoint_1007000/target.decoder.layers_2.self_attention.out.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03f26ca0ead9419ea7cfa15817244bbe994d0288e6a9d72acb37efc10cc5b157
|
3 |
+
size 7816682
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp12038369456628083008.~1663960300500390~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp12834423916420665428.~1663960300495461~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp12994895879745033.~1663960300551356~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp2221344313489107808.~1663960300387123~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp4445478388728139901.~1663960300774328~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/.zarray.__tmp9955060625844959214.~1663960300497171~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67d085de47b90e0af3954f637367ad44941569aa38027b411897b9330ae2fc9c
|
3 |
+
size 7806698
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13cad133c55dc8e4c897e8cdf1f91fa4d9e778223f5204550b2b8bde4929696b
|
3 |
+
size 7808017
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0413bee867342984e006f7dcaa896f19ddcb9f8970d224a8ce532da0bf10905a
|
3 |
+
size 7822696
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cab5ab9c5c176a4a47d3e1df5f4cfefb24146717ae9e666718c13219c4ce9fb
|
3 |
+
size 7809114
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b728c953a608f8f314af768df8abd59804a2f4c32324e36ce43b2aeef89af52
|
3 |
+
size 7809390
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c76169add9849481976a0fb7135aa55ed00ee03615aae8f372296e66ffa3270
|
3 |
+
size 7810479
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84e86b61ac018a3ba736eb19314b7bd545057eff9eab43824f999cc285bef946
|
3 |
+
size 7808193
|
checkpoint_1007000/target.decoder.layers_7.encoder_decoder_attention.query.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edb72721817bb1dfe5cf969237cfec5c0ac2a85389b0466cb3ccc55ac0168e5b
|
3 |
+
size 7809618
|
checkpoint_1007000/target.encoder.layers_1.pre_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|