Spaces:

prosekutor
/

sentiment-analysis

Running

App Files Files Community

prosekutor committed on Sep 28, 2022

Commit

d799ebd

1 Parent(s): 2d7e826

added application files

Browse files

Files changed (3) hide show

app.py +68 -0
models/model_v1.pkl +3 -0
models/transformer_v1.pkl +3 -0

app.py ADDED Viewed

	@@ -0,0 +1,68 @@

+import gradio as gr
+import joblib as jb
+import re
+import string
+from nltk.corpus import stopwords
+from nltk.tokenize import word_tokenize
+from nltk.stem import PorterStemmer, WordNetLemmatizer
+import nltk
+nltk.download('stopwords')
+stop_words = set(stopwords.words('english'))
+cv = jb.load('.//models//transformer_v1.pkl')
+model = jb.load('.//models//model_v1.pkl')
+def preprocess_text(text):
+    """
+    Runs a set of transformational steps to
+    preprocess the text of the tweet.
+    """
+    # convert all text to lower case
+    text = text.lower()
+    # remove any urls
+    text = re.sub(r'http\S+|www\S+|https\S+', "", text, flags=re.MULTILINE)
+    # replace '****' with 'curse'
+    text = re.sub(r'\*\*\*\*', "gaali", text)
+    # remove punctuations
+    text = text.translate(str.maketrans("", "", string.punctuation))
+    # remove user @ references and hashtags
+    text = re.sub(r'\@\w+|\#', "", text)
+    # remove useless characters
+    text = re.sub(r'[^ -~]', '', text)
+    # remove stopwords
+    tweet_tokens = word_tokenize(text)
+    filtered_words = [word for word in tweet_tokens if word not in stop_words]
+    # stemming
+    ps = PorterStemmer()
+    stemmed_words = [ps.stem(w) for w in filtered_words]
+    # lemmatizing
+    lemmatizer = WordNetLemmatizer()
+    lemma_words = [lemmatizer.lemmatize(w, pos='a') for w in stemmed_words]
+    return ' '.join(lemma_words)
+def sentiment_analysis(text):
+    print(text)
+    text = cv.transform([preprocess_text(text)])
+    pred_prob = model.predict_proba(text)[0]
+    output = {"Negative": float(pred_prob[0]), "Neutral": float(pred_prob[1]), "Positive": float(pred_prob[2])}
+    print(output)
+    return output
+demo = gr.Interface(
+    fn=sentiment_analysis,
+    inputs=gr.Textbox(label="Input here", lines=2, placeholder="Input your text"),
+    outputs=gr.Label(label="Sentiment Analysis"),
+)
+demo.launch()

models/model_v1.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:28b989f2dec37cb7615dee7d299189decf1d15647fa92e1e9b6f38966a994449
+size 419236163

models/transformer_v1.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9fb9484ac5da542395636d3f2bed85ee06109f66eb4923d11bc0da05218a8357
+size 232123