csukuangfj's picture
add model files
50d6551
raw
history blame
No virus
741 Bytes
#!/usr/bin/env python3
import sys
from typing import Dict
def load_tokens():
ans = dict()
i = 0
with open("tokens.json", encoding="utf-8") as f:
for line in f:
line = line.strip()
if '[' in line: continue
if ']' in line: continue
if '"' in line and ',' in line:
line = line[1:-2]
ans[i] = line.strip()
i += 1
print('num tokens', i)
return ans
def write_tokens(tokens: Dict[int, str]):
with open("tokens.txt", "w", encoding="utf-8") as f:
for idx, s in tokens.items():
f.write(f"{s} {idx}\n")
def main():
tokens = load_tokens()
write_tokens(tokens)
if __name__ == "__main__":
main()