Spaces:

kkesarwani
/

SentimentAnalysis

Sleeping

App Files Files Community

kkesarwani committed on Mar 19, 2024

Commit

1a44e19

1 Parent(s): faabc3a

gru model for sentiment analysis

Browse files

Files changed (8) hide show

.DS_Store +0 -0
.gitattributes +1 -0
app.py +55 -0
examples.txt +4 -0
helper_functions.py +68 -0
label_names.txt +4 -0
models/gru_model.keras +3 -0
requirements.txt +138 -0

.DS_Store ADDED Viewed

Binary file (6.15 kB). View file

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.keras filter=lfs diff=lfs merge=lfs -text

app.py ADDED Viewed

	@@ -0,0 +1,55 @@

+import gradio as gr
+import tensorflow as tf
+from sklearn.preprocessing import LabelEncoder
+import spacy
+from timeit import default_timer as timer
+from helper_functions import preprocess_single_sentence
+with open('label_names.txt', 'r') as f:
+    labels = [emotion.strip() for emotion in f.readlines()]
+with open('examples.txt', 'r') as f:
+    example_list = [example.strip() for example in f.readlines()]
+encoder= LabelEncoder()
+encoder.fit(labels)
+nlp = spacy.load("en_core_web_sm")
+model = tf.keras.models.load_model('models/gru_model.keras')
+def make_predictions(text):
+    """
+    Make predictions on the given text using the trained model.
+    Args:
+        text (str): The text to make predictions on.
+    Returns:
+        list: A list of predictions.
+    """
+    text= preprocess_single_sentence(text)
+    text= tf.expand_dims(text, 0)
+    start_time= timer()
+    probability = model.predict(text)
+    pred_label_with_prob= {labels[i]: float(probability[0][i]) for i in range(len(labels))}
+    pred_time = round(timer() - start_time, 5)
+    return pred_label_with_prob, pred_time
+input= gr.Textbox(lines=5, label="Enter text", placeholder="i like to have the same breathless feeling as a reader eager to see what will happen next")
+outputs=[
+        gr.Label(num_top_classes=len(labels), label="Predictions"),
+        gr.Number(label="Prediction time (s)"),
+    ]
+title= ' Sentiment Analysis 🤣😱😡😢 '
+description= 'The sentiment analysis model is a deep learning-based natural language processing (NLP) model designed to analyze and classify the sentiment expressed in text data. It is trained to understand the emotional tone of text and categorize it into predefined sentiment categories such as <b>anger, fear, saddness and joy.<b>'
+demo= gr.Interface(fn=make_predictions,
+                   inputs=input,
+                   outputs=outputs,
+                   title=title,
+                   description=description,
+                   examples= example_list
+                  )
+demo.launch()

examples.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+im feeling rather rotten so im not very ambitious right now
+i left with my bouquet of red and yellow tulips under my arm feeling slightly more optimistic than when i arrived
+i cant walk into a shop anywhere where i do not feel uncomfortable
+i felt anger when at the end of a telephone call

helper_functions.py ADDED Viewed

	@@ -0,0 +1,68 @@

+import pandas as pd
+import matplotlib.pyplot as plt
+import seaborn as sns
+from sklearn.preprocessing import LabelEncoder
+import spacy
+with open('label_names.txt', 'r') as f:
+    labels = [emotion.strip() for emotion in f.readlines()]
+encoder= LabelEncoder()
+encoder.fit(labels)
+nlp = spacy.load("en_core_web_sm")
+def plot_pie_chart(data_frame: pd.DataFrame, title: str) -> None:
+    """
+    Plot a pie chart to visualize label distribution in the provided DataFrame.
+    Args:
+        data_frame (pd.DataFrame): The DataFrame containing the data to visualize.
+        title (str): The title for the pie chart.
+    Returns:
+        None
+    """
+    label_count = data_frame['label'].value_counts()
+    plt.figure(figsize=(8, 8))
+    sns.set_style("whitegrid")
+    plt.pie(label_count, labels=label_count.index, colors=sns.color_palette("hls", len(label_count.index)), autopct='%1.1f%%', startangle=90)
+    plt.title(f"{title} Label Distribution")
+    plt.show()
+    plt.close()
+def preprocess_text(df: pd.DataFrame, emotions: list=['love', 'surprise']):
+    """
+    Preprocesses text data in a DataFrame.
+    Args:
+        df (pd.DataFrame): DataFrame containing 'sentence' and 'label' columns.
+        encoder (LabelEncoder): Label encoder for the labels.
+        emotions (list): List of emotions to drop from the DataFrame.
+    Returns:
+        pd.DataFrame: DataFrame with preprocessed text and encoded labels.
+    """
+    for i in emotions:
+        df = df[df['label'] != i]
+    df['processed_text'] = df['text'].apply(lambda x: ' '.join([token.lemma_ for token in nlp(x) if not token.is_stop and not token.is_punct and not token.is_space]))
+    df['label_num'] = encoder.transform(df['label'])
+    df.drop(columns=['text', 'label'], inplace=True)
+    return df
+def preprocess_single_sentence(sentence):
+    """
+    Preprocesses a single sentence.
+    Args:
+        sentence (str): Input sentence.
+    Returns:
+        str: Preprocessed and tokenized sentence.
+    """
+    processed_text = ' '.join([token.lemma_ for token in nlp(sentence) if not token.is_stop and not token.is_punct and not token.is_space])
+    return processed_text

label_names.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+joy
+sadness
+fear
+anger

models/gru_model.keras ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5e1e9d49645ff672edec9f35fd19857b9143b0e9295d759886bbb50f7cfdba0d
+size 9241147

requirements.txt ADDED Viewed

	@@ -0,0 +1,138 @@

+absl-py==2.1.0
+aiofiles==23.2.1
+altair==5.2.0
+annotated-types==0.6.0
+anyio==4.3.0
+appnope==0.1.4
+asttokens==2.4.1
+astunparse==1.6.3
+attrs==23.2.0
+blis==0.7.11
+catalogue==2.0.10
+certifi==2024.2.2
+charset-normalizer==3.3.2
+click==8.1.7
+cloudpathlib==0.16.0
+colorama==0.4.6
+comm==0.2.2
+confection==0.1.4
+contourpy==1.2.0
+cycler==0.12.1
+cymem==2.0.8
+debugpy==1.8.1
+decorator==5.1.1
+en-core-web-sm @ https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.1/en_core_web_sm-3.7.1-py3-none-any.whl#sha256=86cc141f63942d4b2c5fcee06630fd6f904788d2f0ab005cce45aadb8fb73889
+exceptiongroup==1.2.0
+executing==2.0.1
+fastapi==0.110.0
+ffmpy==0.3.2
+filelock==3.13.1
+flatbuffers==24.3.7
+fonttools==4.50.0
+fsspec==2024.3.1
+gast==0.5.4
+google-pasta==0.2.0
+gradio==4.21.0
+gradio_client==0.12.0
+grpcio==1.62.1
+h11==0.14.0
+h5py==3.10.0
+httpcore==1.0.4
+httpx==0.27.0
+huggingface-hub==0.21.4
+idna==3.6
+importlib_metadata==7.0.2
+importlib_resources==6.3.1
+ipykernel==6.29.3
+ipython==8.18.1
+jedi==0.19.1
+Jinja2==3.1.3
+joblib==1.3.2
+jsonschema==4.21.1
+jsonschema-specifications==2023.12.1
+jupyter_client==8.6.1
+jupyter_core==5.7.2
+keras==3.1.0
+kiwisolver==1.4.5
+langcodes==3.3.0
+libclang==18.1.1
+Markdown==3.6
+markdown-it-py==3.0.0
+MarkupSafe==2.1.5
+matplotlib==3.8.3
+matplotlib-inline==0.1.6
+mdurl==0.1.2
+ml-dtypes==0.3.2
+murmurhash==1.0.10
+namex==0.0.7
+nest-asyncio==1.6.0
+numpy==1.26.4
+opt-einsum==3.3.0
+optree==0.10.0
+orjson==3.9.15
+packaging==24.0
+pandas==2.2.1
+parso==0.8.3
+pexpect==4.9.0
+pillow==10.2.0
+platformdirs==4.2.0
+preshed==3.0.9
+prompt-toolkit==3.0.43
+protobuf==4.25.3
+psutil==5.9.8
+ptyprocess==0.7.0
+pure-eval==0.2.2
+pydantic==2.6.4
+pydantic_core==2.16.3
+pydub==0.25.1
+Pygments==2.17.2
+pyparsing==3.1.2
+python-dateutil==2.9.0.post0
+python-multipart==0.0.9
+pytz==2024.1
+PyYAML==6.0.1
+pyzmq==25.1.2
+referencing==0.34.0
+requests==2.31.0
+rich==13.7.1
+rpds-py==0.18.0
+ruff==0.3.3
+scikit-learn==1.4.1.post1
+scipy==1.12.0
+seaborn==0.13.2
+semantic-version==2.10.0
+shellingham==1.5.4
+six==1.16.0
+smart-open==6.4.0
+sniffio==1.3.1
+spacy==3.7.4
+spacy-legacy==3.0.12
+spacy-loggers==1.0.5
+srsly==2.4.8
+stack-data==0.6.3
+starlette==0.36.3
+tensorboard==2.16.2
+tensorboard-data-server==0.7.2
+tensorflow==2.16.1
+tensorflow-io-gcs-filesystem==0.36.0
+termcolor==2.4.0
+thinc==8.2.3
+threadpoolctl==3.3.0
+tomlkit==0.12.0
+toolz==0.12.1
+tornado==6.4
+tqdm==4.66.2
+traitlets==5.14.2
+typer==0.9.0
+typing_extensions==4.10.0
+tzdata==2024.1
+urllib3==2.2.1
+uvicorn==0.28.1
+wasabi==1.1.2
+wcwidth==0.2.13
+weasel==0.3.4
+websockets==11.0.3
+Werkzeug==3.0.1
+wordcloud==1.9.3
+wrapt==1.16.0
+zipp==3.18.1