Annalyn Ng committed on
Commit
ecfe3e6
1 Parent(s): 93be2eb

add preprocessing to add mask

Browse files
Files changed (1) hide show
  1. app.py +9 -3
app.py CHANGED
@@ -12,12 +12,18 @@ mask_token = tokenizer.mask_token
12
  text = f"雨天,我整个人就便{mask_token}了,不想出外,甚至不想去上课。"
13
  target_word = "懒惰"
14
 
 
 
 
 
15
  def eval_prob(target_word, text):
 
 
16
  # Get index of target_word
17
  idx = tokenizer.encode(target_word)[2]
18
 
19
  # Get logits
20
- inputs = tokenizer(text, return_tensors="pt")
21
  token_logits = model(**inputs).logits
22
 
23
  # Find the location of the MASK and extract its logits
@@ -36,8 +42,8 @@ def eval_prob(target_word, text):
36
  gr.Interface(
37
  fn=eval_prob,
38
  inputs=[
39
- gr.Textbox(placeholder="懒惰"),
40
- gr.Textbox(placeholder=f"雨天,我整个人就便{mask_token}了,不想出外,甚至不想去上课。"),
41
  ],
42
  outputs="text",
43
  title="Chinese Sentence Grading",
 
12
  text = f"雨天,我整个人就便{mask_token}了,不想出外,甚至不想去上课。"
13
  target_word = "懒惰"
14
 
15
+ def add_mask(target_word, text):
16
+ text_mask = text.replace(target_word, mask_token)
17
+ return text_mask
18
+
19
  def eval_prob(target_word, text):
20
+
21
+ text_mask = add_mask(target_word, text)
22
  # Get index of target_word
23
  idx = tokenizer.encode(target_word)[2]
24
 
25
  # Get logits
26
+ inputs = tokenizer(text_mask, return_tensors="pt")
27
  token_logits = model(**inputs).logits
28
 
29
  # Find the location of the MASK and extract its logits
 
42
  gr.Interface(
43
  fn=eval_prob,
44
  inputs=[
45
+ gr.Textbox(placeholder="夸大"),
46
+ gr.Textbox(placeholder=f"我们使用 Generative AI 已经很长时间了,所以他们最近的媒体报道可能被夸大了。"),
47
  ],
48
  outputs="text",
49
  title="Chinese Sentence Grading",