# File size: 569 Bytes
# 749745d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
from .simple_tokenizer import SimpleTokenizer


def build_tokenizer(tokenizer_name):
    """Construct the tokenizer selected by ``tokenizer_name``.

    Recognized names:

    * ``"clip"`` -- returns a ``SimpleTokenizer()``.
    * ``"hf_<name>"`` -- returns ``HFPTTokenizer(pt_name="<name>")``.
    * ``"hfc_<name>"`` -- returns ``HFPTTokenizer(pt_name="<name>")``.

    The ``hf_`` / ``hfc_`` markers are matched as *prefixes* only, and exactly
    the matched prefix is stripped before the remainder is passed on as
    ``pt_name``. A name that merely contains one of the markers somewhere in
    the middle is rejected instead of being sliced at the wrong offset.

    Args:
        tokenizer_name: String identifier of the tokenizer to build.

    Returns:
        A ``SimpleTokenizer`` or ``HFPTTokenizer`` instance.

    Raises:
        ValueError: If ``tokenizer_name`` matches none of the forms above.
    """
    if tokenizer_name == "clip":
        return SimpleTokenizer()

    # The two prefixes are mutually exclusive under startswith ("hfc_..."
    # does not start with "hf_"), so the order of this tuple does not matter.
    for prefix in ("hf_", "hfc_"):
        if tokenizer_name.startswith(prefix):
            # Kept as a function-local import, as in the original code, so the
            # module is only loaded when this kind of tokenizer is requested
            # (presumably to avoid pulling in its dependencies otherwise).
            from .hfpt_tokenizer import HFPTTokenizer

            return HFPTTokenizer(pt_name=tokenizer_name[len(prefix):])

    raise ValueError("Unknown tokenizer")