TimeRobber committed on
Commit
fde254a
·
1 Parent(s): 960b0d6

Upload part 53

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +48 -0
  2. checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/.zarray +1 -0
  5. checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/0 +0 -0
  6. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray +1 -0
  7. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp11256787251253775817.~1663960300467721~ +1 -0
  8. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp12376700607849326301.~1663960300873893~ +1 -0
  9. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp13988132894120306426.~1663960300465831~ +1 -0
  10. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp2003657211397809811.~1663960300499679~ +1 -0
  11. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp3018502066720724520.~1663960300422243~ +1 -0
  12. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp5367369300786217474.~1663960300272671~ +1 -0
  13. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp9890861163220608993.~1663960300865166~ +1 -0
  14. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/0.0 +3 -0
  15. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/1.0 +3 -0
  16. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/2.0 +3 -0
  17. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/3.0 +3 -0
  18. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/4.0 +3 -0
  19. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/5.0 +3 -0
  20. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/6.0 +3 -0
  21. checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/7.0 +3 -0
  22. checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/.zarray +1 -0
  23. checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/0 +0 -0
  24. checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/.zarray +1 -0
  25. checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/0 +0 -0
  26. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray +1 -0
  27. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp14160688709433772055.~1663960300611045~ +1 -0
  28. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp15873416349169901159.~1663960300826076~ +1 -0
  29. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp16849527841429843420.~1663960300468248~ +1 -0
  30. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4255918781242121777.~1663960300779427~ +1 -0
  31. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4421445606442611016.~1663960300384782~ +1 -0
  32. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4539221328564997070.~1663960300600813~ +1 -0
  33. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp9398104159734428444.~1663960300688560~ +1 -0
  34. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.0 +3 -0
  35. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.1 +3 -0
  36. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.2 +3 -0
  37. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.3 +3 -0
  38. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.4 +3 -0
  39. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.5 +3 -0
  40. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.6 +3 -0
  41. checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.7 +3 -0
  42. checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/.zarray +1 -0
  43. checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/0 +0 -0
  44. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray +1 -0
  45. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp11915811710181766548.~1663960300425573~ +1 -0
  46. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp12223102092994640126.~1663960300724757~ +1 -0
  47. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp16570448508998648983.~1663960300609977~ +1 -0
  48. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp17425754235712849754.~1663960300421170~ +1 -0
  49. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp1843410830924711088.~1663960300545905~ +1 -0
  50. checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp5183710400972140093.~1663960300626578~ +1 -0
.gitattributes CHANGED
@@ -2673,3 +2673,51 @@ checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/3.0 filter=lfs d
2673
  checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2674
  checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2675
  checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2673
  checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2674
  checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2675
  checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2676
+ checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2677
+ checkpoint_1007000/target.encoder.layers_8.attention.out.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2678
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2679
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2680
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2681
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2682
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2683
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2684
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2685
+ checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2686
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2687
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2688
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2689
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2690
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2691
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2692
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2693
+ checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2694
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2695
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2696
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2697
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2698
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2699
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2700
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2701
+ checkpoint_1007000/target.encoder.layers_20.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2702
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2703
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2704
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2705
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2706
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2707
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2708
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2709
+ checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2710
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2711
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2712
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2713
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2714
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2715
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2716
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2717
+ checkpoint_1007000/target.encoder.layers_3.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2718
+ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2719
+ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2720
+ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2721
+ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2722
+ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2723
+ checkpoint_1007000/target.encoder.layers_19.attention.out.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_23.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (14.4 kB). View file
 
checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_12.pre_mlp_layer_norm.scale/0 ADDED
Binary file (14.7 kB). View file
 
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp11256787251253775817.~1663960300467721~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp12376700607849326301.~1663960300873893~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp13988132894120306426.~1663960300465831~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp2003657211397809811.~1663960300499679~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp3018502066720724520.~1663960300422243~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp5367369300786217474.~1663960300272671~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/.zarray.__tmp9890861163220608993.~1663960300865166~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cd567082bc1f857b9b74c39f20a14a54305030750f427447b78060559ccd655
3
+ size 19536740
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7f042ee0239a3d75d39afe8aa605232aeb518a417baf6fe51b4dc678b69362f
3
+ size 19536437
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/2.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1740f1ff22b516d28755469b4ad3d05f5b5c482bee78c865d9ebd95ccdbf1fc5
3
+ size 19537072
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/3.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de72446230ffd496ba585f0789ac98497f83e8209c566efbe56df1f47f6cb308
3
+ size 19535933
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/4.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af0711164d99a304bef96bce45cacb8755fdd45d4cad80c8d78608f58fb2c24b
3
+ size 19536727
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/5.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6d2c6d716aa8dc6e97c4eb957c36551d34654a313302a99c4c9a5e5e59cf415
3
+ size 19536375
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/6.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:514530b30562578cf9a28b04e3162478be54e63b7528c5c919b6d5aefa2bb237
3
+ size 19538075
checkpoint_1007000/target.decoder.layers_17.mlp.wo.kernel/7.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f16d2ad632fc66c5557464c7e93cb0bffa99c5a69ca6918743599d2bff9cdbc4
3
+ size 19536537
checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_5.pre_self_attention_layer_norm.scale/0 ADDED
Binary file (15 kB). View file
 
checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.pre_mlp_layer_norm.scale/0 ADDED
Binary file (14.7 kB). View file
 
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp14160688709433772055.~1663960300611045~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp15873416349169901159.~1663960300826076~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp16849527841429843420.~1663960300468248~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4255918781242121777.~1663960300779427~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4421445606442611016.~1663960300384782~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp4539221328564997070.~1663960300600813~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/.zarray.__tmp9398104159734428444.~1663960300688560~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84b18db2f91f2930220701c7ee39da698d3f6bb679e1f82ac04f67ed6c660c70
3
+ size 7820805
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17baf72eb0cd4b6bd3ef9ac000c04e00462a0b8f9a71bf2fe45b1ba47ac8747e
3
+ size 7821468
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc7364a6be8a0c3a59b9980a7dd2d2efc2d525e6ca7756e1bafbc097e22598a5
3
+ size 7821758
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b6600f27687e4f790246618db3c46d1b7875fe1af316996a7d5144c3c843026
3
+ size 7822096
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c42cd53d4d32e7063f179d3103805595770bd55f51de131ddab5617c126608b
3
+ size 7822824
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0392651ed9dda37b1230de96fc28b1c31fcaa91bd35738f9fdf98e80d890d665
3
+ size 7820366
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a6fc8fb0b7262fe49ea1801870c6026fd0125d8e4848719974871ebe3d4c44
3
+ size 7821561
checkpoint_1007000/target.decoder.layers_7.self_attention.value.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:035628cf1a31400d6bd3b3e07b19dc58102cb4f9a9114de20359520009cf847c
3
+ size 7821431
checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.pre_attention_layer_norm.scale/0 ADDED
Binary file (15.1 kB). View file
 
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp11915811710181766548.~1663960300425573~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp12223102092994640126.~1663960300724757~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp16570448508998648983.~1663960300609977~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp17425754235712849754.~1663960300421170~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp1843410830924711088.~1663960300545905~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_15.attention.key.kernel/.zarray.__tmp5183710400972140093.~1663960300626578~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}