Commit
·
fde254a
1
Parent(s):
960b0d6
Upload part 53
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +48 -0
- checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp11256787251253775817.~1663960300467721~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp12376700607849326301.~1663960300873893~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp13988132894120306426.~1663960300465831~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp2003657211397809811.~1663960300499679~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp3018502066720724520.~1663960300422243~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp5367369300786217474.~1663960300272671~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp9890861163220608993.~1663960300865166~ +1 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp14160688709433772055.~1663960300611045~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp15873416349169901159.~1663960300826076~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp16849527841429843420.~1663960300468248~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4255918781242121777.~1663960300779427~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4421445606442611016.~1663960300384782~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4539221328564997070.~1663960300600813~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp9398104159734428444.~1663960300688560~ +1 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp11915811710181766548.~1663960300425573~ +1 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp12223102092994640126.~1663960300724757~ +1 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp16570448508998648983.~1663960300609977~ +1 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp17425754235712849754.~1663960300421170~ +1 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp1843410830924711088.~1663960300545905~ +1 -0
- checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp5183710400972140093.~1663960300626578~ +1 -0
.gitattributes
CHANGED
@@ -2673,3 +2673,51 @@ checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/3.0 filter=lfs d
|
|
2673 |
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2674 |
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2675 |
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2673 |
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2674 |
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2675 |
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2676 |
+
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2677 |
+
checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2678 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2679 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2680 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2681 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2682 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2683 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2684 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2685 |
+
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2686 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2687 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2688 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2689 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2690 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2691 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2692 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2693 |
+
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2694 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2695 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2696 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2697 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2698 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2699 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2700 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2701 |
+
checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2702 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2703 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2704 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2705 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2706 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2707 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2708 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2709 |
+
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2710 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2711 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2712 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2713 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2714 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2715 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2716 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2717 |
+
checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2718 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2719 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2720 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2721 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2722 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2723 |
+
checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (14.4 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/0
ADDED
Binary file (14.7 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp11256787251253775817.~1663960300467721~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp12376700607849326301.~1663960300873893~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp13988132894120306426.~1663960300465831~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp2003657211397809811.~1663960300499679~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp3018502066720724520.~1663960300422243~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp5367369300786217474.~1663960300272671~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp9890861163220608993.~1663960300865166~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cd567082bc1f857b9b74c39f20a14a54305030750f427447b78060559ccd655
|
3 |
+
size 19536740
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7f042ee0239a3d75d39afe8aa605232aeb518a417baf6fe51b4dc678b69362f
|
3 |
+
size 19536437
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1740f1ff22b516d28755469b4ad3d05f5b5c482bee78c865d9ebd95ccdbf1fc5
|
3 |
+
size 19537072
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de72446230ffd496ba585f0789ac98497f83e8209c566efbe56df1f47f6cb308
|
3 |
+
size 19535933
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af0711164d99a304bef96bce45cacb8755fdd45d4cad80c8d78608f58fb2c24b
|
3 |
+
size 19536727
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6d2c6d716aa8dc6e97c4eb957c36551d34654a313302a99c4c9a5e5e59cf415
|
3 |
+
size 19536375
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:514530b30562578cf9a28b04e3162478be54e63b7528c5c919b6d5aefa2bb237
|
3 |
+
size 19538075
|
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f16d2ad632fc66c5557464c7e93cb0bffa99c5a69ca6918743599d2bff9cdbc4
|
3 |
+
size 19536537
|
checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/0
ADDED
Binary file (15 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/0
ADDED
Binary file (14.7 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp14160688709433772055.~1663960300611045~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp15873416349169901159.~1663960300826076~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp16849527841429843420.~1663960300468248~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4255918781242121777.~1663960300779427~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4421445606442611016.~1663960300384782~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4539221328564997070.~1663960300600813~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp9398104159734428444.~1663960300688560~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84b18db2f91f2930220701c7ee39da698d3f6bb679e1f82ac04f67ed6c660c70
|
3 |
+
size 7820805
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17baf72eb0cd4b6bd3ef9ac000c04e00462a0b8f9a71bf2fe45b1ba47ac8747e
|
3 |
+
size 7821468
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc7364a6be8a0c3a59b9980a7dd2d2efc2d525e6ca7756e1bafbc097e22598a5
|
3 |
+
size 7821758
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b6600f27687e4f790246618db3c46d1b7875fe1af316996a7d5144c3c843026
|
3 |
+
size 7822096
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c42cd53d4d32e7063f179d3103805595770bd55f51de131ddab5617c126608b
|
3 |
+
size 7822824
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0392651ed9dda37b1230de96fc28b1c31fcaa91bd35738f9fdf98e80d890d665
|
3 |
+
size 7820366
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96a6fc8fb0b7262fe49ea1801870c6026fd0125d8e4848719974871ebe3d4c44
|
3 |
+
size 7821561
|
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:035628cf1a31400d6bd3b3e07b19dc58102cb4f9a9114de20359520009cf847c
|
3 |
+
size 7821431
|
checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/0
ADDED
Binary file (15.1 kB). View file
|
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp11915811710181766548.~1663960300425573~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp12223102092994640126.~1663960300724757~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp16570448508998648983.~1663960300609977~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp17425754235712849754.~1663960300421170~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp1843410830924711088.~1663960300545905~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp5183710400972140093.~1663960300626578~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|