Spaces:
Running
on
Zero
Running
on
Zero
# Copyright (c) Meta Platforms, Inc. and affiliates.
import abc
class Tokenizer(abc.ABC): | |
def encode(self, text: str, add_bos: bool, add_eos: bool): | |
pass | |
def decode(self, tokens: list[int]): | |
pass | |
def get_token_offsets( | |
self, text: str, tokens: list[int] | None = None | |
) -> tuple[list[str], list[int]]: | |
"""Return the offsets of the tokens in the original text. Only used for evaluation.""" | |
pass | |
def get_vocab_size(self) -> int: | |
pass | |