kotstantinovskii committed on
Commit
c57f5ec
1 Parent(s): 38aae15

Upload tokenizer.py

Browse files
Files changed (1) hide show
  1. tokenizer.py +7 -0
tokenizer.py ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ from transformers import DistilBertTokenizerFast
3
+
4
+
5
@st.cache(allow_output_mutation=True)
def get_tokenizer(num_labels=153):
    """Load the pretrained ``distilbert-base-uncased`` fast tokenizer.

    The function is wrapped in ``st.cache(allow_output_mutation=True)``.

    Args:
        num_labels: Forwarded unchanged as a keyword argument to
            ``DistilBertTokenizerFast.from_pretrained``. Defaults to 153.

    Returns:
        The object returned by ``DistilBertTokenizerFast.from_pretrained``.
    """
    # NOTE(review): num_labels is usually a model-head setting rather than a
    # tokenizer option -- confirm it is actually needed here before removing.
    checkpoint = 'distilbert-base-uncased'
    tokenizer = DistilBertTokenizerFast.from_pretrained(
        checkpoint,
        num_labels=num_labels,
    )
    return tokenizer