Commit
·
79e2321
1
Parent(s):
1e33f3e
Upload part 46
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +47 -0
- checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10130132370000382642.~1663960299882054~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10954122248698558262.~1663960300073222~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp11709688572954520360.~1663960299677964~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp14956069949774084406.~1663960300075491~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp4025274537859120413.~1663960300017995~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp12479244418913466456.~1663960300685403~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp5189599943241222398.~1663960300885553~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9533798046376307163.~1663960300551871~ +1 -0
- checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9666493176089962186.~1663960300686970~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp10278330172052962831.~1663960300424944~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp11926956483067476319.~1663960300385701~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp15791834445691843274.~1663960300724828~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp1714517278612008761.~1663960300466758~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp18021455530413911774.~1663960300776722~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp4364215189749523097.~1663960300420323~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp5709416680492409645.~1663960300551197~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.7 +3 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10398387860063871791.~1663960300385660~ +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10700189453700589260.~1663960300778874~ +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp14196631297793674538.~1663960300685115~ +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp17083914858304621802.~1663960300989814~ +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp6968194478073802803.~1663960300548716~ +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp9240234483793240192.~1663960300610878~ +1 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.3 +3 -0
.gitattributes
CHANGED
@@ -2339,3 +2339,50 @@ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 filter=lfs diff=lf
|
|
2339 |
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2340 |
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2341 |
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2339 |
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2340 |
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2341 |
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2342 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2343 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2344 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2345 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2346 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2347 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2348 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2349 |
+
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2350 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2351 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2352 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2353 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2354 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2355 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2356 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2357 |
+
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2358 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2359 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2360 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2361 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2362 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2363 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2364 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2365 |
+
checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2366 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2367 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2368 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2369 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2370 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2371 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2372 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2373 |
+
checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2374 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2375 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2376 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2377 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2378 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2379 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2380 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2381 |
+
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2382 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2383 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2384 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2385 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2386 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2387 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2388 |
+
checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (15 kB). View file
|
|
checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (14.8 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10130132370000382642.~1663960299882054~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10954122248698558262.~1663960300073222~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp11709688572954520360.~1663960299677964~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp14956069949774084406.~1663960300075491~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp4025274537859120413.~1663960300017995~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a83c26214e409481a714f084ece9e067cca4762d0af8aadbe5857ba13d8b0489
|
3 |
+
size 7815472
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1c317d3ca1e1771c8d5960d333239c9edcd635ef9b51a2f61d25fcec1099851
|
3 |
+
size 7829309
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21150fdd44d99220013d321faf65228101d41a5df30771c6fde236cf3bc81ad2
|
3 |
+
size 7815100
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bab84779b4c131b08620c70171a4a93e3bfb15a0f9f0904557461dcb131670e7
|
3 |
+
size 7812569
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c3770ae12dfce408e692544c4a112b3913e1403433b9a818f362a30046cb11a
|
3 |
+
size 7822649
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d31f30e22520bd72134897be7def712846310aaf0435ebecf107a655664ffb5
|
3 |
+
size 7811908
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d1edf0f281f471f95e9d7c03b83831113eae2dd0f9dd1db13f95097f0ccab88
|
3 |
+
size 7819892
|
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcac29c17010bb3cc600bb4c44199ff64454ff377a739c1ae328875e15b0a042
|
3 |
+
size 7818316
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp12479244418913466456.~1663960300685403~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp5189599943241222398.~1663960300885553~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9533798046376307163.~1663960300551871~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9666493176089962186.~1663960300686970~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp10278330172052962831.~1663960300424944~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp11926956483067476319.~1663960300385701~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp15791834445691843274.~1663960300724828~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp1714517278612008761.~1663960300466758~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp18021455530413911774.~1663960300776722~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp4364215189749523097.~1663960300420323~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp5709416680492409645.~1663960300551197~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4634fa7bc859ab93145358e930f516b1af4d41af952c998beb0a5c19147ab2a8
|
3 |
+
size 19555434
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:288bec55b995218320f7376ac4ed1eaf3ddb0811a2cdf2af1ca4447d1ec3c4f2
|
3 |
+
size 19558146
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d74fa8efe1dadeea42b3622f085a18c86a92af50a676d25b6e7f46b1953947d6
|
3 |
+
size 19557656
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f55a8f784287b7fa506a4f2cc8129dbdb4458afb1886400f39c3e6f6f9e2c47a
|
3 |
+
size 19554736
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9af2dc6e88c0b52d3b2778c8da695120b4f4af775d75509a76d1c744ec670850
|
3 |
+
size 19559210
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13f1571ec30c10983b517f469a67a0205478e823c23cc65ddfa6a99ef136add0
|
3 |
+
size 19554503
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bed2a1d4defc5b51618e20425c92f0a80ece226cca3a30953b53574b7fbe590
|
3 |
+
size 19558320
|
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f9aa132b4adfb8e7d663f0897aa41c39ce0c64fa30c8fd078db837654248c08
|
3 |
+
size 19556316
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10398387860063871791.~1663960300385660~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10700189453700589260.~1663960300778874~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp14196631297793674538.~1663960300685115~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp17083914858304621802.~1663960300989814~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp6968194478073802803.~1663960300548716~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp9240234483793240192.~1663960300610878~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bac07b58214c98ef696ca8fcfb2bea453d2da5fafe98a4356c6817e7062d7bf
|
3 |
+
size 7807422
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7753b3cce5efb8ce609ce0728fb7ace2da8186da69b338d25dcb9fc80dd05b6a
|
3 |
+
size 7810124
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59bccb8735f098b3d33ecb29e500e8860d1b897e6ecac939b30cd116c8c4e7fb
|
3 |
+
size 7807194
|
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9afa991b4eb47d4f2312701000efa22643791e5045668990a9bca467331f15e
|
3 |
+
size 7810691
|