DPLM-650M / base_tokenizer.py
lhallee's picture
Upload base_tokenizer.py with huggingface_hub
2193303 verified
raw
history blame contribute delete
255 Bytes
from transformers import PreTrainedTokenizerBase
class BaseSequenceTokenizer:
    """Base wrapper that holds a tokenizer for sequence inputs.

    The tokenizer passed to the constructor is kept on ``self.tokenizer``.
    Calling an instance is not implemented at this level.
    """

    def __init__(self, tokenizer: PreTrainedTokenizerBase):
        """Store *tokenizer* on the instance as ``self.tokenizer``."""
        self.tokenizer = tokenizer

    def __call__(self, sequences, **kwargs):
        """Always raise ``NotImplementedError`` in this base class.

        NOTE(review): presumably subclasses override this to process
        ``sequences`` with ``self.tokenizer`` -- confirm against subclasses.

        Raises:
            NotImplementedError: Unconditionally.
        """
        raise NotImplementedError()