Commit
·
b0438b3
1
Parent(s):
e6333a8
Upload part 69
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +44 -0
- checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10110197242313532362.~1663960300134224~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10286619748446951564.~1663960300075313~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10967580320069937423.~1663960300016844~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp16759264667472233231.~1663960300548020~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp18273606472686788359.~1663960300090522~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp2080791846667276183.~1663960299724161~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp518315626624162999.~1663960299928038~ +1 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/1.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/3.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/6.0 +3 -0
- checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp14327996386050127580.~1663960300873999~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp17032425602126076780.~1663960300497654~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp1753918392538626836.~1663960300685740~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3294400150320527675.~1663960300599494~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3346837884784373481.~1663960300471058~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp5366360317273826532.~1663960300887653~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp9189606845200779608.~1663960300888237~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12689500621936917338.~1663960300387560~ +1 -0
- checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12826010473743220668.~1663960300466418~ +1 -0
.gitattributes
CHANGED
@@ -3415,3 +3415,47 @@ checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.1 filter=lfs d
|
|
3415 |
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3416 |
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3417 |
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3415 |
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3416 |
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3417 |
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3418 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3419 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3420 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3421 |
+
checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3422 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3423 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3424 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3425 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3426 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3427 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3428 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3429 |
+
checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3430 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
3431 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
3432 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
3433 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3434 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
3435 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
3436 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
3437 |
+
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
3438 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3439 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3440 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3441 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3442 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3443 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3444 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3445 |
+
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3446 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3447 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3448 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3449 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3450 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3451 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3452 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3453 |
+
checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3454 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
3455 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
3456 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
3457 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3458 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
3459 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
3460 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
3461 |
+
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (14.5 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (14.3 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (14.8 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (15.1 kB). View file
|
|
checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (15.2 kB). View file
|
|
checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (15.3 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10110197242313532362.~1663960300134224~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10286619748446951564.~1663960300075313~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10967580320069937423.~1663960300016844~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp16759264667472233231.~1663960300548020~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp18273606472686788359.~1663960300090522~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp2080791846667276183.~1663960299724161~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp518315626624162999.~1663960299928038~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:365a39068ec56b2a772bc2f92bc2ac93b346d38e75508feb9319031a774aa69e
|
3 |
+
size 19533167
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/1.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f33fe7d8dd30b262bcd4bc823214da106af1712c43d0f0c116130cab9eb4fb3
|
3 |
+
size 19533024
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f388bc06c8cedec52cca4a582667de0a9ccd10fa548738650528c9869f0e44e6
|
3 |
+
size 19533703
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/3.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afe0fd96f95d0a2498489d4b94434e5cbd1bac3ffab63756a4c9834641b77562
|
3 |
+
size 19534390
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5e2874bff20cbeed9a5d32a83bc6ec711ed523966929c8c8ad9e47b0ac7161a
|
3 |
+
size 19532712
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5997959a9e6107b5165772d674d1fa0a998aab5b3e135a3ba45b9b9a96f2a1f1
|
3 |
+
size 19533820
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/6.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e224a2bf0cbe670b182b981cc0ef17b3c9ac56d4dd3e0db19bf890cde1ac9f2a
|
3 |
+
size 19534103
|
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02012ec2c592fc78bae9ea1e49a39c7720775d1ab5a1255831f51669dc7acf74
|
3 |
+
size 19533710
|
checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/0
ADDED
Binary file (14.7 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp14327996386050127580.~1663960300873999~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp17032425602126076780.~1663960300497654~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp1753918392538626836.~1663960300685740~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3294400150320527675.~1663960300599494~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3346837884784373481.~1663960300471058~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp5366360317273826532.~1663960300887653~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp9189606845200779608.~1663960300888237~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab9176229d836379b69949913e6764516e6d5042cc2bcd94401359bf76d7018
|
3 |
+
size 19496376
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e8b748c2bffc82e3cc34bd458c94cb02940dc40afc9d2d12d66e921b34763dc
|
3 |
+
size 19496861
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b077faa8610c0ef903776c348a8757a633fdee97eba5b3da4d325cf2586acc6
|
3 |
+
size 19496752
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be00813515261c4f3121cc3ec61aeb810c4377b2944ed37f260442fb73e1057d
|
3 |
+
size 19496513
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91b58f63e180e2acff3493e7c1861ea6964515c0660cbc9fc5a6b05a4c977940
|
3 |
+
size 19496845
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88510a82f225899aaa8ab8dafcdac8901c3a86e80ef3ee370209864760ea033b
|
3 |
+
size 19496641
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffb93d19ca61328b1f309110187c6208add98018bb0540f3246b76401cb20c20
|
3 |
+
size 19495657
|
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df5f781e40042921452fe36d2ac956bcad4ce1330f3c20d1992cea466b888787
|
3 |
+
size 19496371
|
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12689500621936917338.~1663960300387560~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12826010473743220668.~1663960300466418~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
|