TimeRobber commited on
Commit
b0438b3
·
1 Parent(s): e6333a8

Upload part 69

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +44 -0
  2. checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  5. checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/0 +0 -0
  6. checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  7. checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +0 -0
  8. checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  9. checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/0 +0 -0
  10. checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/.zarray +1 -0
  11. checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/0 +0 -0
  12. checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  13. checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/0 +0 -0
  14. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray +1 -0
  15. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10110197242313532362.~1663960300134224~ +1 -0
  16. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10286619748446951564.~1663960300075313~ +1 -0
  17. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10967580320069937423.~1663960300016844~ +1 -0
  18. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp16759264667472233231.~1663960300548020~ +1 -0
  19. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp18273606472686788359.~1663960300090522~ +1 -0
  20. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp2080791846667276183.~1663960299724161~ +1 -0
  21. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp518315626624162999.~1663960299928038~ +1 -0
  22. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/0.0 +3 -0
  23. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/1.0 +3 -0
  24. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 +3 -0
  25. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/3.0 +3 -0
  26. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 +3 -0
  27. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 +3 -0
  28. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/6.0 +3 -0
  29. checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0 +3 -0
  30. checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/.zarray +1 -0
  31. checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/0 +0 -0
  32. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray +1 -0
  33. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp14327996386050127580.~1663960300873999~ +1 -0
  34. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp17032425602126076780.~1663960300497654~ +1 -0
  35. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp1753918392538626836.~1663960300685740~ +1 -0
  36. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3294400150320527675.~1663960300599494~ +1 -0
  37. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3346837884784373481.~1663960300471058~ +1 -0
  38. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp5366360317273826532.~1663960300887653~ +1 -0
  39. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp9189606845200779608.~1663960300888237~ +1 -0
  40. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.0 +3 -0
  41. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.1 +3 -0
  42. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.2 +3 -0
  43. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.3 +3 -0
  44. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.4 +3 -0
  45. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.5 +3 -0
  46. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.6 +3 -0
  47. checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.7 +3 -0
  48. checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray +1 -0
  49. checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12689500621936917338.~1663960300387560~ +1 -0
  50. checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12826010473743220668.~1663960300466418~ +1 -0
.gitattributes CHANGED
@@ -3415,3 +3415,47 @@ checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.1 filter=lfs d
3415
  checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
3416
  checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3417
  checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3415
  checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
3416
  checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3417
  checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
3418
+ checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
3419
+ checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
3420
+ checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
3421
+ checkpoint_1007000/target.encoder.layers_1.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
3422
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
3423
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
3424
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3425
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
3426
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
3427
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
3428
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
3429
+ checkpoint_1007000/target.encoder.layers_18.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
3430
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
3431
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
3432
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
3433
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3434
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
3435
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
3436
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
3437
+ checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
3438
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
3439
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
3440
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3441
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
3442
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
3443
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
3444
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
3445
+ checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
3446
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
3447
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
3448
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3449
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
3450
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
3451
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
3452
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
3453
+ checkpoint_1007000/target.encoder.layers_19.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
3454
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
3455
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
3456
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
3457
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
3458
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
3459
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
3460
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
3461
+ checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_19.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (14.5 kB). View file
 
checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_22.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (14.3 kB). View file
 
checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (14.8 kB). View file
 
checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_9.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (15.1 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (15.2 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_3.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (15.3 kB). View file
 
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10110197242313532362.~1663960300134224~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10286619748446951564.~1663960300075313~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp10967580320069937423.~1663960300016844~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp16759264667472233231.~1663960300548020~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp18273606472686788359.~1663960300090522~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp2080791846667276183.~1663960299724161~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/.zarray.__tmp518315626624162999.~1663960299928038~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:365a39068ec56b2a772bc2f92bc2ac93b346d38e75508feb9319031a774aa69e
3
+ size 19533167
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f33fe7d8dd30b262bcd4bc823214da106af1712c43d0f0c116130cab9eb4fb3
3
+ size 19533024
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f388bc06c8cedec52cca4a582667de0a9ccd10fa548738650528c9869f0e44e6
3
+ size 19533703
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afe0fd96f95d0a2498489d4b94434e5cbd1bac3ffab63756a4c9834641b77562
3
+ size 19534390
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/4.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5e2874bff20cbeed9a5d32a83bc6ec711ed523966929c8c8ad9e47b0ac7161a
3
+ size 19532712
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/5.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5997959a9e6107b5165772d674d1fa0a998aab5b3e135a3ba45b9b9a96f2a1f1
3
+ size 19533820
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/6.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e224a2bf0cbe670b182b981cc0ef17b3c9ac56d4dd3e0db19bf890cde1ac9f2a
3
+ size 19534103
checkpoint_1007000/target.decoder.layers_0.mlp.wo.kernel/7.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02012ec2c592fc78bae9ea1e49a39c7720775d1ab5a1255831f51669dc7acf74
3
+ size 19533710
checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.pre_cross_attention_layer_norm.scale/0 ADDED
Binary file (14.7 kB). View file
 
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp14327996386050127580.~1663960300873999~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp17032425602126076780.~1663960300497654~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp1753918392538626836.~1663960300685740~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3294400150320527675.~1663960300599494~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp3346837884784373481.~1663960300471058~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp5366360317273826532.~1663960300887653~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/.zarray.__tmp9189606845200779608.~1663960300888237~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab9176229d836379b69949913e6764516e6d5042cc2bcd94401359bf76d7018
3
+ size 19496376
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e8b748c2bffc82e3cc34bd458c94cb02940dc40afc9d2d12d66e921b34763dc
3
+ size 19496861
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b077faa8610c0ef903776c348a8757a633fdee97eba5b3da4d325cf2586acc6
3
+ size 19496752
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be00813515261c4f3121cc3ec61aeb810c4377b2944ed37f260442fb73e1057d
3
+ size 19496513
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91b58f63e180e2acff3493e7c1861ea6964515c0660cbc9fc5a6b05a4c977940
3
+ size 19496845
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88510a82f225899aaa8ab8dafcdac8901c3a86e80ef3ee370209864760ea033b
3
+ size 19496641
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffb93d19ca61328b1f309110187c6208add98018bb0540f3246b76401cb20c20
3
+ size 19495657
checkpoint_1007000/target.decoder.layers_20.mlp.wi_1.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df5f781e40042921452fe36d2ac956bcad4ce1330f3c20d1992cea466b888787
3
+ size 19496371
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12689500621936917338.~1663960300387560~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_4.mlp.wo.kernel/.zarray.__tmp12826010473743220668.~1663960300466418~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}