Spaces:

shibing624
/

pycorrector

Running

App Files Community

shibing624 committed on Feb 14, 2022

Commit

fdab1ea

•

1 Parent(s): 04a455f

update demo.

Browse files

Files changed (1) hide show

app.py +15 -19

app.py CHANGED Viewed

@@ -7,9 +7,9 @@ tokenizer = BertTokenizer.from_pretrained("shibing624/macbert4csc-base-chinese")
 model = BertForMaskedLM.from_pretrained("shibing624/macbert4csc-base-chinese")
-def ai_text(texts):
     with torch.no_grad():
-        outputs = model(**tokenizer(texts, padding=True, return_tensors='pt'))
     def get_errors(corrected_text, origin_text):
         sub_details = []
@@ -29,30 +29,26 @@ def ai_text(texts):
         sub_details = sorted(sub_details, key=operator.itemgetter(2))
         return corrected_text, sub_details
-    result = []
-    for ids, text in zip(outputs.logits, texts):
-        _text = tokenizer.decode(torch.argmax(ids, dim=-1), skip_special_tokens=True).replace(' ', '')
-        corrected_text = _text[:len(text)]
-        corrected_text, details = get_errors(corrected_text, text)
-        print(text, ' => ', corrected_text, details)
-        result.append((corrected_text, details))
-    print(result)
-    return result
 if __name__ == '__main__':
-    print(ai_text(['少先队员因该为老人让坐']))
     examples = [
-        [['真麻烦你了。希望你们好好的跳无']],
-        [['少先队员因该为老人让坐']],
-        [['机七学习是人工智能领遇最能体现智能的一个分知']],
-        [['今天心情很好']],
-        [['他法语说的很好，的语也不错']],
-        [['他们的吵翻很不错，再说他们做的咖喱鸡也好吃']],
     ]
     output_text = gr.outputs.Textbox()
-    gr.Interface(ai_text, "textbox", output_text, title="Chinese Text Correction shibing624/macbert4csc-base-chinese",
                  description="Copy or input error Chinese text. Submit and the machine will correct text.",
                  examples=examples).launch()

 model = BertForMaskedLM.from_pretrained("shibing624/macbert4csc-base-chinese")
+def ai_text(text):
     with torch.no_grad():
+        outputs = model(**tokenizer(text, padding=True, return_tensors='pt'))
     def get_errors(corrected_text, origin_text):
         sub_details = []
         sub_details = sorted(sub_details, key=operator.itemgetter(2))
         return corrected_text, sub_details
+    _text = tokenizer.decode(torch.argmax(outputs.logits, dim=-1), skip_special_tokens=True).replace(' ', '')
+    corrected_text = _text[:len(text)]
+    corrected_text, details = get_errors(corrected_text, text)
+    print(text, ' => ', corrected_text, details)
+    return corrected_text, details
 if __name__ == '__main__':
+    print(ai_text('少先队员因该为老人让坐'))
     examples = [
+        ['真麻烦你了。希望你们好好的跳无'],
+        ['少先队员因该为老人让坐'],
+        ['机七学习是人工智能领遇最能体现智能的一个分知'],
+        ['今天心情很好'],
+        ['他法语说的很好，的语也不错'],
+        ['他们的吵翻很不错，再说他们做的咖喱鸡也好吃'],
     ]
     output_text = gr.outputs.Textbox()
+    gr.Interface(ai_text, "textbox", "textbox", title="Chinese Text Correction shibing624/macbert4csc-base-chinese",
                  description="Copy or input error Chinese text. Submit and the machine will correct text.",
                  examples=examples).launch()