Spaces:

curtpond
/

mle10-glg-demo

Sleeping

curtpond committed on Feb 11, 2023

Commit

0f34ca3

1 Parent(s): 8d08fb9

Added preprocessing steps to app.py.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,14 +2,38 @@
 import gradio as gr
 from sklearn.linear_model import LogisticRegression
 import pickle5 as pickle
 # file name
 lr_filename = 'logistic_regression.pkl'
 # Load model from pickle file
 model = pickle.load(open(lr_filename, 'rb'))
-# Define function to make a prediction with the model
 def predict(text):
     return model.predict([text])

 import gradio as gr
 from sklearn.linear_model import LogisticRegression
 import pickle5 as pickle
+import re
+import string
+import nltk
+import re
+from nltk.corpus import stopwords
+nltk.download('stopwords')
+from sklearn.feature_extraction.text import CountVectorizer
 # file name
 lr_filename = 'logistic_regression.pkl'
+# Process input text, including removing stopwords, converting to lowercase, and removing punctuation
+def process_text(text):
+    text = stopwords.words('english')
+    text = str(text).lower()
+    text = re.sub(
+        f"[{re.escape(string.punctuation)}]", " ", text
+    )
+    text = " ".join(text.split())
+    return text
+# Vectorize input text
+vectorizer = CountVectorizer()
+def vectorize_text(text):
+    text = process_text(text)
+    text = [text]
+    return vectorizer.transform(text)
 # Load model from pickle file
 model = pickle.load(open(lr_filename, 'rb'))
 def predict(text):
     return model.predict([text])