Spaces:

ki33elev
/

Transformer_arxiv_classification

Runtime error

ki33elev committed on Mar 26, 2022

Commit

62096a0

•

1 Parent(s): 41e544a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -18,6 +18,8 @@ def load_model():
 @st.cache(suppress_st_warning=True, hash_funcs={tokenizers.Tokenizer: lambda _: None})
 def predict(title, summary, tokenizer, model):
     text = title + "\n" + summary
     tokens = tokenizer.encode(text)
     with torch.no_grad():
         logits = model(torch.as_tensor([tokens]))[0]
@@ -38,7 +40,7 @@ def predict(title, summary, tokenizer, model):
 @st.cache(suppress_st_warning=True)
 def get_results(prediction, prediction_probs):
-    frame =  pd.DataFrame({'Topic': prediction, 'Confidence': prediction_probs})
     frame.index = np.arange(1, len(frame) + 1)
     return frame
@@ -47,7 +49,7 @@ label_to_theme = {0: 'Computer science', 1: 'Economics', 2: 'Electrical Engineer
 st.title("Arxiv articles classification")
 st.markdown("<h1 style='text-align: center;'><img width=300px src='https://media.wired.com/photos/592700e3cfe0d93c474320f1/191:100/w_1200,h_630,c_limit/faces-icon.jpg'>", unsafe_allow_html=True)
-st.markdown("This is an interface that can determine the article's topic based on its title and summary. Though it can work with title only, it is recommended that you provide summary if possible - this will result in a better prediction quality.")
 tokenizer, model = load_model()
@@ -58,5 +60,8 @@ button = st.button('Run')
 if button:
     prediction, prediction_probs = predict(title, summary, tokenizer, model)
     ans = get_results(prediction, prediction_probs)
-    st.subheader('Results:')
-    st.write(ans)

 @st.cache(suppress_st_warning=True, hash_funcs={tokenizers.Tokenizer: lambda _: None})
 def predict(title, summary, tokenizer, model):
     text = title + "\n" + summary
+    if len(text) < 20:
+        return 'error'
     tokens = tokenizer.encode(text)
     with torch.no_grad():
         logits = model(torch.as_tensor([tokens]))[0]
 @st.cache(suppress_st_warning=True)
 def get_results(prediction, prediction_probs):
+    frame =  pd.DataFrame({'Category': prediction, 'Confidence': prediction_probs})
     frame.index = np.arange(1, len(frame) + 1)
     return frame
 st.title("Arxiv articles classification")
 st.markdown("<h1 style='text-align: center;'><img width=300px src='https://media.wired.com/photos/592700e3cfe0d93c474320f1/191:100/w_1200,h_630,c_limit/faces-icon.jpg'>", unsafe_allow_html=True)
+st.markdown("This is an interface that can determine the article's category based on its title and summary. Though it can work with title only, it is recommended that you provide summary if possible - this will result in a better prediction quality.")
 tokenizer, model = load_model()
 if button:
     prediction, prediction_probs = predict(title, summary, tokenizer, model)
     ans = get_results(prediction, prediction_probs)
+    if ans == 'error':
+        st.error("Your input is too short. It is probably not a real article, please try again.")
+    else:
+        st.subheader('Results:')
+        st.write(ans)