mathtext-fastapi

Runtime error

Greg Thompson committed on Apr 20, 2023

Commit

b5b1714

1 Parent(s): b1bbf8f

Update keyword matching to work with phrases

Files changed (1) hide show

mathtext_fastapi/nlu.py CHANGED Viewed

@@ -1,9 +1,12 @@
 from collections.abc import Mapping
 from logging import getLogger
 import datetime as dt
 from dateutil.parser import isoparse
 from fuzzywuzzy import fuzz
 from mathtext_fastapi.intent_classification import predict_message_intent
 from mathtext_fastapi.logging import prepare_message_data_for_logging
 from mathtext.sentiment import sentiment
@@ -118,10 +121,10 @@ def run_intent_classification(message_text):
     >>> run_intent_classification("hardier")
     {'type': 'intent', 'data': 'harder', 'confidence': 0.92}
     """
-    label = ''
     ratio = 0
     nlu_response = {'type': 'intent', 'data': label, 'confidence': ratio}
-    commands = [
         'easier',
         'exit',
         'harder',
@@ -141,15 +144,22 @@ def run_intent_classification(message_text):
         'skip',
         'menu'
     ]
-    for command in commands:
         try:
-            ratio = fuzz.ratio(command, message_text.lower())
         except:
-            ratio = 0
-        if ratio > 80:
-            nlu_response['data'] = command
-            nlu_response['confidence'] = ratio / 100
     return nlu_response

+import re
 from collections.abc import Mapping
 from logging import getLogger
 import datetime as dt
 from dateutil.parser import isoparse
 from fuzzywuzzy import fuzz
+from fuzzywuzzy import process
 from mathtext_fastapi.intent_classification import predict_message_intent
 from mathtext_fastapi.logging import prepare_message_data_for_logging
 from mathtext.sentiment import sentiment
     >>> run_intent_classification("hardier")
     {'type': 'intent', 'data': 'harder', 'confidence': 0.92}
     """
+    label = 'no_match'
     ratio = 0
     nlu_response = {'type': 'intent', 'data': label, 'confidence': ratio}
+    keywords = [
         'easier',
         'exit',
         'harder',
         'skip',
         'menu'
     ]
+    try:
+        tokens = re.findall(r"[-a-zA-Z'_]+", message_text.lower())
+    except AttributeError:
+        tokens = ''
+    for keyword in keywords:
         try:
+            tok, score = process.extractOne(keyword, tokens, scorer=fuzz.ratio)
         except:
+            score = 0
+        if score > 80:
+            print(f"TOK: {tok}, SCORE: {score}")
+            nlu_response['data'] = keyword
+            nlu_response['confidence'] = score
     return nlu_response