Commit
·
2870955
1
Parent(s):
97cbfe7
Upload part 51
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +51 -0
- checkpoint_1007000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_0.pre_mlp_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_0.pre_mlp_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp13860182128134203581.~1663960300271669~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp14915792012948216155.~1663960300501020~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp17163698119452819470.~1663960300383704~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp3406813367688477231.~1663960300349079~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp5655637283001257113.~1663960300548058~ +1 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp13274847707321780589.~1663960300780488~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp17395252829058526076.~1663960300826503~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp213421870206833707.~1663960300727333~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp5003615787769520833.~1663960300600253~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp8340153163930010786.~1663960300554676~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp84303314120511463.~1663960300683617~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp924297596789801472.~1663960300730478~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp18331374512781114445.~1663960300822447~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp5794916223614252314.~1663960300549840~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp835427842764133382.~1663960301071694~ +1 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp12186219544965510441.~1663960300554922~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp14892187662735011810.~1663960300495824~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp15649225097279147311.~1663960300549126~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp16478649895859384621.~1663960300549221~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp3285463423068203750.~1663960300419957~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp3966636191724702222.~1663960300728530~ +1 -0
- checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp6342605954107965772.~1663960300465730~ +1 -0
.gitattributes
CHANGED
@@ -2575,3 +2575,54 @@ checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.1 filter=lfs diff=
|
|
2575 |
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2576 |
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2577 |
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2575 |
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2576 |
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2577 |
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2578 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2579 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2580 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2581 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2582 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2583 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2584 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2585 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2586 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2587 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2588 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2589 |
+
checkpoint_1007000/target.decoder.layers_21.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2590 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2591 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2592 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2593 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2594 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2595 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2596 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2597 |
+
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2598 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2599 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2600 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2601 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2602 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2603 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2604 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2605 |
+
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2606 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2607 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2608 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2609 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2610 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2611 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2612 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2613 |
+
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2614 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2615 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2616 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2617 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2618 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2619 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2620 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2621 |
+
checkpoint_1007000/target.encoder.layers_23.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2622 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2623 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2624 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2625 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2626 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2627 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2628 |
+
checkpoint_1007000/target.decoder.layers_19.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0
ADDED
Binary file (14.9 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_0.pre_mlp_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.pre_mlp_layer_norm.scale/0
ADDED
Binary file (14.4 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp13860182128134203581.~1663960300271669~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp14915792012948216155.~1663960300501020~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp17163698119452819470.~1663960300383704~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp3406813367688477231.~1663960300349079~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/.zarray.__tmp5655637283001257113.~1663960300548058~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09598c2d2e1dc1b3e48f1425155b85add328605cedfdaab2eac9e27337154acf
|
3 |
+
size 7819799
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc3fad3b262efe7d4a5d485c22dc2096bb5d01662fcb977d01e56a04cb910834
|
3 |
+
size 7819343
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14c51accb230c8f1441dbcbde5d1671bf78f7e99a95295179978919e05a31cae
|
3 |
+
size 7820685
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98371b044298a2856fd4fe6b6992210018ac51a9a71a185e130b0749ab90f3c2
|
3 |
+
size 7818645
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83967053fe4c2c61ce2cc2e72d46fbe1060b34806c55f5f19b2efe3c59a3beec
|
3 |
+
size 7819763
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca82019ced52974ad804c8bf55a63f9fd8b0cba5783f3d358326907fd5b919cf
|
3 |
+
size 7818666
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bd2af6f089ba6a8f875b812a7753005a0d6fe5495b10e99da2b7ef151be9f3f
|
3 |
+
size 7817429
|
checkpoint_1007000/target.decoder.layers_11.self_attention.out.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:054586900db748deedda49a021e34fd7f91bf58d690f647f3a3f6b0e5c014fb0
|
3 |
+
size 7817990
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp13274847707321780589.~1663960300780488~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp17395252829058526076.~1663960300826503~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp213421870206833707.~1663960300727333~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp5003615787769520833.~1663960300600253~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp8340153163930010786.~1663960300554676~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp84303314120511463.~1663960300683617~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/.zarray.__tmp924297596789801472.~1663960300730478~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3cf41281e43a74ce1e0307e5db0611a149d86aa4ccbb500a63de1d17cc5f147
|
3 |
+
size 19534120
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baede549f8e7deda3488946c53e0c160eafa1dd4715eb394ec3f91e90e583831
|
3 |
+
size 19535274
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68245c82a3cbe4348f1dd561aa088d8b72b042d99ec6ac870d2d75a379069723
|
3 |
+
size 19534720
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6161b3b5a4aa5f4495326bf29024d96040c720fe35b1a2be9943f4c953bbdd66
|
3 |
+
size 19533904
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:943d7d9ccd8c438612c295fa27639098a2720ea5171491fccbd25e9376720377
|
3 |
+
size 19534882
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61403a81040a36f09a55ecdc089d8058df92b55cfac2914f248db1f19922717d
|
3 |
+
size 19535145
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78a0fbe1497b8d461f8640567c6561fcf4075cd3792204fd7c6f863019b02af5
|
3 |
+
size 19534518
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_0.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99bbab6b8f0afcd643695409650a26e22dcb0f5e27c061d9f14dbcabe813704d
|
3 |
+
size 19535172
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp18331374512781114445.~1663960300822447~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp5794916223614252314.~1663960300549840~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/.zarray.__tmp835427842764133382.~1663960301071694~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef2f22620fdf8d8280a5bd129585be82a60c6d86c09ac0cba26f996ffca3fa0f
|
3 |
+
size 19517127
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:751606f3a8d54a92e7805b84c22cf2e1ba3275bb0a5400d46b0ebc61e976dd1e
|
3 |
+
size 19517527
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfd3a6ddd6f3a025953b461928f1c9bbb6db7a2bc2556d831cc635d5d074c299
|
3 |
+
size 19517332
|
checkpoint_1007000/target.decoder.layers_13.mlp.wi_1.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f45fd5529fcf8dc75b94d8b860d1ecd270f43a43053a199de327e57a56aa4a72
|
3 |
+
size 19518280
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp12186219544965510441.~1663960300554922~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp14892187662735011810.~1663960300495824~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp15649225097279147311.~1663960300549126~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp16478649895859384621.~1663960300549221~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp3285463423068203750.~1663960300419957~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp3966636191724702222.~1663960300728530~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_15.mlp.wo.kernel/.zarray.__tmp6342605954107965772.~1663960300465730~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|