codebyzeb's picture
Upload tokenizer
127dad2 verified
raw
history blame contribute delete
424 Bytes
{"UNK":0,"PAD":1,"WORD_BOUNDARY":2,"UTT_BOUNDARY":3,"j":4,"ɛ":5,"h":6,"k":7,"ɑ":8,"m":9,"p":10,"aʊ":11,"n":12,"d":13,"z":14,"θ":15,"ɪ":16,"ŋ":17,"l":18,"aɪ":19,"s":20,"ɜː":21,"t":22,"w":23,"v":24,"ð":25,"æ":26,"ɔ":27,"ɹ":28,"ʌ":29,"f":30,"ə":31,"b":32,"iː":33,"eɪ":34,"oʊ":35,"d̠ʒ":36,"i":37,"uː":38,"iə":39,"ʊ":40,"ɡ":41,"t̠ʃ":42,"ɔɪ":43,"ʃ":44,"ʒ":45,"r":46,"x":47,"ɬ":48,"ɑ̃":49,"nʲ":50}