Upload tokenizer
tokenizer.json  CHANGED  (+4 −2)
@@ -955,7 +955,8 @@
       {
         "type": "Metaspace",
         "replacement": "▁",
-        "add_prefix_space": true
+        "add_prefix_space": true,
+        "prepend_scheme": "always"
       },
       {
         "type": "Digits",
@@ -1012,7 +1013,8 @@
   "decoder": {
     "type": "Metaspace",
     "replacement": "▁",
-    "add_prefix_space": true
+    "add_prefix_space": true,
+    "prepend_scheme": "always"
   },
   "model": {
     "type": "Unigram",
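Both hunks make the same change: the Metaspace pre-tokenizer and the Metaspace decoder gain a "prepend_scheme": "always" field next to the existing "add_prefix_space": true. Newer releases of the tokenizers library express the prefix-space behaviour through prepend_scheme (where add_prefix_space: true corresponds to "always"), and the legacy field appears to be retained so older readers of the file still work. A minimal Python sketch of the equivalent in-memory configuration, assuming a recent tokenizers release (roughly 0.19+) where Metaspace exposes prepend_scheme:

    from tokenizers import pre_tokenizers, decoders

    # Pre-tokenizer entry from the first hunk: always prepend the "▁"
    # replacement character, i.e. prepend_scheme="always".
    pre_tok = pre_tokenizers.Metaspace(replacement="▁", prepend_scheme="always")
    print(pre_tok.pre_tokenize_str("Hello world"))
    # illustrative output: [('▁Hello', (0, 5)), ('▁world', (5, 11))]

    # Decoder entry from the second hunk: inverts the same transformation
    # when turning token strings back into text.
    dec = decoders.Metaspace(replacement="▁", prepend_scheme="always")
    print(dec.decode(["▁Hello", "▁world"]))
    # illustrative output: "Hello world"

Loading the updated file directly with Tokenizer.from_file("tokenizer.json") yields the same pre-tokenizer and decoder without constructing them by hand.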