KaleiNeely
committed on
Commit
•
beb1045
1
Parent(s):
357d495
Update tokenization_rwkv_world.py
Browse files
tokenization_rwkv_world.py
CHANGED
@@ -202,7 +202,8 @@ class RWKVWorldTokenizer(PreTrainedTokenizer):
|
|
202 |
return tokens
|
203 |
|
204 |
def decodeBytes(self, tokens):
|
205 |
-
|
|
|
206 |
|
207 |
def _tokenize(self, text, **kwargs):
|
208 |
"""Tokenize a string."""
|
|
|
202 |
return tokens
|
203 |
|
204 |
def decodeBytes(self, tokens):
|
205 |
+
byte_sequence = [self.encoder[i] for i in tokens if i != 0]
|
206 |
+
return b''.join(byte_sequence)
|
207 |
|
208 |
def _tokenize(self, text, **kwargs):
|
209 |
"""Tokenize a string."""
|