# Quick inspection script for the tokenizer exposed by vocab.glm_chinese.
from vocab.glm_chinese import tokenizer

# Decode a single-id sequence (token id 20) and print the decoded result.
print(tokenizer.decode([20]))

# Fetch the tokenizer's vocabulary and dump it to stdout.
# NOTE(review): presumably a token -> id mapping; confirm against the
# tokenizer implementation, since its type is not visible from this file.
vocab = tokenizer.get_vocab()
print(vocab)