Commit
·
0f3aef5
1
Parent(s):
8c8fd09
Upload part 39
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +49 -0
- checkpoint_1007000/state.param_states.decoder.layers_23.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_23.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp3793136575924832461.~1663960300471028~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp3828504504174363840.~1663960300504917~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp4841820670922943543.~1663960300599408~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp4883026910358667386.~1663960300505005~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp6065072650473970600.~1663960300420127~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp7179883116167104197.~1663960300425528~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp7285427626859680122.~1663960300775053~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp11641026415366376429.~1663960300688455~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp15086851991299262910.~1663960300424961~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp10223974096948240717.~1663960300774109~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp11003946157143400568.~1663960300823025~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp12169865525578298057.~1663960300420411~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp15299951200537059570.~1663960300467147~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp16754694326085659845.~1663960301030840~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp6899721829295772493.~1663960300551877~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp9305821517494390229.~1663960300351245~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_3.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_3.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp1089770536934074408.~1663960300307684~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp14675306242868088798.~1663960300779261~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp15683271990944503386.~1663960300311869~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp2648441519406468586.~1663960300090606~ +1 -0
- checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp4613967575850716566.~1663960300601965~ +1 -0
.gitattributes
CHANGED
@@ -1990,3 +1990,52 @@ checkpoint_1007000/target.decoder.layers_9.mlp.wo.kernel/4.0 filter=lfs diff=lfs
|
|
1990 |
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1991 |
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1992 |
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1990 |
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1991 |
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
1992 |
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
1993 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
1994 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
1995 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
1996 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
1997 |
+
checkpoint_1007000/target.encoder.layers_2.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
1998 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
1999 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2000 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2001 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2002 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2003 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2004 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2005 |
+
checkpoint_1007000/target.encoder.layers_2.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2006 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2007 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2008 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2009 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2010 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2011 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2012 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2013 |
+
checkpoint_1007000/target.encoder.layers_8.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2014 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2015 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2016 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2017 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2018 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2019 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2020 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2021 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2022 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2023 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2024 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2025 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2026 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2027 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2028 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2029 |
+
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2030 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2031 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2032 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2033 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2034 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2035 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2036 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2037 |
+
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2038 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2039 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2040 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2041 |
+
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_23.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_23.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (14.3 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp3793136575924832461.~1663960300471028~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp3828504504174363840.~1663960300504917~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp4841820670922943543.~1663960300599408~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp4883026910358667386.~1663960300505005~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp6065072650473970600.~1663960300420127~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp7179883116167104197.~1663960300425528~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/.zarray.__tmp7285427626859680122.~1663960300775053~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1f7400b3c517e3a4d6142b2c78897eb50d732be5340f3c5e4a7adda006c264a
|
3 |
+
size 19533332
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce925b430f2548e6d7e5b9d7616dff8d56fb346118dafc3649bd82a8c5b9a2e4
|
3 |
+
size 19534128
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:773d26052df1f2567873f83c9ae4e140dcda2d604128d738ff66ef9d5321a326
|
3 |
+
size 19532162
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09b2d551dba53cb6b3497551f3da32e2724320331c580bff062c359ab54c0783
|
3 |
+
size 19532414
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e185c9e5638e8837093ce2fd63afdf6cb4b417ce1d8db95b2c7645f80062f5b
|
3 |
+
size 19534854
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3aa56e1cd946d475f901d97392a4af4a7db68408eb69f6899e76e950ad5516a0
|
3 |
+
size 19533396
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dc0f390e07ac7e24315a2566703dc62e1ea73539efe6bd9a6ed5c15040a1a0c
|
3 |
+
size 19533357
|
checkpoint_1007000/target.decoder.layers_2.mlp.wo.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9fb389ef003cf74bad49f39fd47dfb919cceb86ada35cb40aa68aaf14629673
|
3 |
+
size 19533457
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp11641026415366376429.~1663960300688455~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/.zarray.__tmp15086851991299262910.~1663960300424961~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25e1c00d5eaa0c8f5a1e0891bf06abaac9dca314f5ac8b5b4b05a9da2f595b3c
|
3 |
+
size 7822461
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3932cd77623e7c6997d77b86b03172e7cc639a165b6f5abd683ae745d8fcec65
|
3 |
+
size 7809793
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07f49750ccda07d043d28e3452a9b3fbd8c07e5417316c4f71c7d1579efea3be
|
3 |
+
size 7819818
|
checkpoint_1007000/target.decoder.layers_2.self_attention.value.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb7a70491144d33b915a8dfbef881d9da1faecb975a466193e2850923938a68e
|
3 |
+
size 7821231
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp10223974096948240717.~1663960300774109~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp11003946157143400568.~1663960300823025~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp12169865525578298057.~1663960300420411~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp15299951200537059570.~1663960300467147~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp16754694326085659845.~1663960301030840~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp6899721829295772493.~1663960300551877~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/.zarray.__tmp9305821517494390229.~1663960300351245~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26055cc7ed2e1ece5872feddd5fddecc28f5ba9885d76a2c0746defb27860d46
|
3 |
+
size 7804341
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04ac54db40bea6548e4c4be60cffad2454c3d35b278b3052a143259500af8ef2
|
3 |
+
size 7806506
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b7369015658cc9ddda4792bdcc7bcb90267aa3451778a7cc67d3df26d64d687
|
3 |
+
size 7804806
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1898486495207a39d5d327fac98c61113ebfa6ed63c3b90ca910ffc96fe21cb2
|
3 |
+
size 7804310
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17b3f9f7409cb8d6082a348bf812db6f4d40c6b29c1b66b524a3dfd40c61c51e
|
3 |
+
size 7804346
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f85047671754b2eb56b7bc1d3f6dceacdb1e01d7ff0155e553f4091804a367e7
|
3 |
+
size 7805929
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0415deb3e23efd071840599f0b1df6eeeca04355600aab5e510f1881cffa160f
|
3 |
+
size 7805476
|
checkpoint_1007000/target.decoder.layers_20.encoder_decoder_attention.out.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ac55656285cdab7032398a675b3aeea38b632b9b814b11510f5a868d6cc97e8
|
3 |
+
size 7803039
|
checkpoint_1007000/target.decoder.layers_3.pre_cross_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_3.pre_cross_attention_layer_norm.scale/0
ADDED
Binary file (14.9 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp1089770536934074408.~1663960300307684~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp14675306242868088798.~1663960300779261~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp15683271990944503386.~1663960300311869~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp2648441519406468586.~1663960300090606~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_8.self_attention.out.kernel/.zarray.__tmp4613967575850716566.~1663960300601965~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[512,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|