"""Smoke-test script: encode one sample Chinese string and print the result.

The tokenizer object is supplied by the project-local module
``vocab.chinese_llama2``; this script only calls its ``encode`` method and
prints whatever that call returns.
"""

from vocab.chinese_llama2 import tokenizer

# Sample input kept verbatim. NOTE(review): "站位符" may be a typo for
# "占位符" (placeholder) -- confirm with the author before changing it, since
# the exact characters determine the encoding that gets printed.
encoding = tokenizer.encode("开始站位符试试")

# Presumably a sequence of token ids; the exact return type depends on the
# tokenizer implementation, which is not visible here -- TODO confirm.
print(encoding)