Commit
·
d67cac2
1
Parent(s):
7ff1e80
Upload part 8
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +38 -0
- checkpoint_1007000/state.param_states.decoder.layers_8.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_8.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp11580674703462496483.~1663960300133883~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp12013653300323734407.~1663960300075446~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp1439279929598701435.~1663960300016739~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp15358612188062969342.~1663960299886873~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp16156460410913044609.~1663960300090205~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp18378342970470495361.~1663960300548461~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp227103591838630531.~1663960300984367~ +1 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/1.0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/2.0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/3.0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/4.0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/5.0 +0 -0
- checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/7.0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp13990057939055935324.~1663960300271662~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp2183204862279246314.~1663960300307572~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp3221719338029875643.~1663960300420431~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp4659058574314254544.~1663960300222823~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp8672360034043645680.~1663960300625653~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp8937493478627982074.~1663960300089977~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp13086528977603015265.~1663960300826535~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp13626986717575320523.~1663960300423568~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp4400733564188167551.~1663960300728424~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp490738057587649164.~1663960300348075~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp5373375306913877844.~1663960300550916~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp7614666875835642548.~1663960300546990~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp7920143289180409639.~1663960300467775~ +1 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.6 +3 -0
.gitattributes
CHANGED
@@ -419,3 +419,41 @@ checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.5 filter=lf
|
|
419 |
checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
420 |
checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
421 |
checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
419 |
checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
420 |
checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
421 |
checkpoint_1007000/target.encoder.layers_12.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
422 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
423 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
424 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
425 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
426 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
427 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
428 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
429 |
+
checkpoint_1007000/target.encoder.layers_7.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
430 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
431 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
432 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
433 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
434 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
435 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
436 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
437 |
+
checkpoint_1007000/target.encoder.layers_9.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
438 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
439 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
440 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
441 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
442 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
443 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
444 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
445 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
446 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
447 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
448 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
449 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
450 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
451 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
452 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
453 |
+
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
454 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
455 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
456 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
457 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
458 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
459 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_8.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_8.pre_cross_attention_layer_norm.scale.v/0
ADDED
Binary file (14.9 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp11580674703462496483.~1663960300133883~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp12013653300323734407.~1663960300075446~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp1439279929598701435.~1663960300016739~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp15358612188062969342.~1663960299886873~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp16156460410913044609.~1663960300090205~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp18378342970470495361.~1663960300548461~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray.__tmp227103591838630531.~1663960300984367~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[8,32],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[64,32],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0
ADDED
Binary file (1 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/1.0
ADDED
Binary file (1.01 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/2.0
ADDED
Binary file (1.02 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/3.0
ADDED
Binary file (1 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/4.0
ADDED
Binary file (1.01 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/5.0
ADDED
Binary file (1 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.relpos_bias.rel_embedding.v/7.0
ADDED
Binary file (1.01 kB). View file
|
|
checkpoint_1007000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (15.3 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp13990057939055935324.~1663960300271662~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp2183204862279246314.~1663960300307572~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp3221719338029875643.~1663960300420431~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp4659058574314254544.~1663960300222823~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp8672360034043645680.~1663960300625653~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/.zarray.__tmp8937493478627982074.~1663960300089977~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8415ef9b65d0c79457afd8f76637688647612f8cd83956136d13aed5192c9c74
|
3 |
+
size 7804198
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13cc7cd9a50cd2f0a20ac7a89636f994b255a3b734fcd29466dca2a3aaf0dd1b
|
3 |
+
size 7803396
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32e1c03969b5db84051e390f710dd5b03752cab42c49409862c9981b3c5fa5d1
|
3 |
+
size 7804501
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72adb90a2d249e342c9744f9ec8eb84d2f4c4569f2283b5b35cbe038953c08d0
|
3 |
+
size 7805500
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b4231c23df965763d6b0cbbfe54dd2a4631930b293936d5792712baa75dd054
|
3 |
+
size 7804889
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ff46acd36d20955cd6c569b9d8958c14abb74561a8cec10c0cc69b852364ded
|
3 |
+
size 7804234
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67268da62bab1c54fffd067a28cec030ed09a878894c5eb4de47267bd7afe734
|
3 |
+
size 7804133
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.query.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba876a22c8ad2b7199b571c3f5a04cc437bdcd259f965a1a255a6ca09cbdc9ca
|
3 |
+
size 7803263
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp13086528977603015265.~1663960300826535~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp13626986717575320523.~1663960300423568~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp4400733564188167551.~1663960300728424~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp490738057587649164.~1663960300348075~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp5373375306913877844.~1663960300550916~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp7614666875835642548.~1663960300546990~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/.zarray.__tmp7920143289180409639.~1663960300467775~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ec65cf62a11071470ce12a7fd93ac38f57479d5d4e881c5178a325414251a0a
|
3 |
+
size 7807108
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c086032c0bf31631bbe464600ac761184daca58caaf02cc963b73ea0f012e514
|
3 |
+
size 7803043
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7e5c3e4fa0cae4d062a5309eb16421a096b4f095ac4ce5f3e34037dd4192f08
|
3 |
+
size 7802922
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7494a1c53823ba2e7c5b6e8f5f191269a836a518575d5799a8a6b54b1171377e
|
3 |
+
size 7797853
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b725f47c05dedc259f818196c16a4e1bfdb16c83b57a6942e98b2e85b46a48db
|
3 |
+
size 7800211
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00cbd469f23ebcec44a76ab29bdea583b60e72cadc758a4832096cc3d76155d0
|
3 |
+
size 7803725
|
checkpoint_1007000/target.decoder.layers_12.encoder_decoder_attention.value.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b617bd0e615f55ffd86c9571490ba47b7c9fc84b5941fcb399e3f3dadd526ea
|
3 |
+
size 7799615
|