DPLM-3B / base_tokenizer.py
lhallee's picture
Upload base_tokenizer.py with huggingface_hub
fd3769e verified
raw
history blame contribute delete
255 Bytes
from transformers import PreTrainedTokenizerBase
class BaseSequenceTokenizer:
    """Thin base wrapper that holds a tokenizer for sequence inputs.

    The base class only stores the tokenizer it is given; calling an
    instance directly always raises ``NotImplementedError``, so concrete
    behaviour has to come from a subclass that overrides ``__call__``.
    """

    # The hint is a string forward reference so that it is not evaluated
    # when the class body is executed.
    def __init__(self, tokenizer: "PreTrainedTokenizerBase") -> None:
        """Keep a reference to *tokenizer* on ``self.tokenizer``."""
        self.tokenizer = tokenizer

    def __call__(self, sequences, **kwargs):
        """Tokenize *sequences*; not implemented on the base class.

        Args:
            sequences: The input to tokenize. The base class does not
                inspect it.
            **kwargs: Extra options; ignored by the base class.

        Raises:
            NotImplementedError: Always, in this base implementation.
        """
        raise NotImplementedError