Commit
·
7f770c6
1
Parent(s):
bf6a00d
Update tokenization_rwkv_world.py
Browse files
tokenization_rwkv_world.py
CHANGED
|
@@ -202,7 +202,8 @@ class RWKVWorldTokenizer(PreTrainedTokenizer):
|
|
| 202 |
return tokens
|
| 203 |
|
| 204 |
def decodeBytes(self, tokens):
|
| 205 |
-
|
|
|
|
| 206 |
|
| 207 |
def _tokenize(self, text, **kwargs):
|
| 208 |
"""Tokenize a string."""
|
|
|
|
| 202 |
return tokens
|
| 203 |
|
| 204 |
def decodeBytes(self, tokens):
|
| 205 |
+
byte_sequence = [self.encoder[i] for i in tokens if i != 0]
|
| 206 |
+
return b''.join(byte_sequence)
|
| 207 |
|
| 208 |
def _tokenize(self, text, **kwargs):
|
| 209 |
"""Tokenize a string."""
|