Spaces:

nneka
/

MemorySupportChatbot

Build error

App Files Files Community

nneka commited on Mar 9

Commit

d091a7a

•

1 Parent(s): bf8b87a

Upload streamlit_app.py

Browse files

Files changed (1) hide show

streamlit_app.py +111 -0

streamlit_app.py ADDED Viewed

	@@ -0,0 +1,111 @@

+# Import necessary libraries
+import streamlit as st
+from transformers import GPT2Tokenizer, GPT2LMHeadModel
+from wordcloud import WordCloud
+import matplotlib.pyplot as plt
+import pandas as pd
+import nltk
+from nltk.corpus import stopwords
+from nltk.tokenize import word_tokenize
+# Download NLTK resources if not already downloaded
+try:
+    nltk.data.find('tokenizers/punkt')
+    nltk.data.find('corpora/stopwords')
+    nltk.data.find('sentiment/vader_lexicon')
+except LookupError:
+    nltk.download('punkt')
+    nltk.download('stopwords')
+    nltk.download('vader_lexicon')
+# Load GPT-2 tokenizer and model
+tokenizer = GPT2Tokenizer.from_pretrained('gpt2')
+model = GPT2LMHeadModel.from_pretrained('gpt2')
+# Load and preprocess data
+# Assuming df is a DataFrame containing the cleaned text
+# Make sure df is defined or loaded correctly before using it in Streamlit components
+txt_files = [
+    "Cognition in Pregnancy- Perceptions and Performance, 2005-2006 - Dataset - B2FIND.txt",
+    "Frontiers | Cognitive disorder and associated factors among pregnant women attending antenatal servi.txt",
+    "Frustrated By Brain Fog? How Pregnancy Actually Alters Yo....txt",
+    "Is Pregnancy Brain Real?.txt",
+    "Is ‘pregnancy brain’ real or just a myth? | Your Pregnancy Matters | UT Southwestern Medical Center.txt",
+    "Memory and affective changes during the antepartum- A narrative review and integrative hypothesis- J.txt",
+    "Pregnancy 'does cause memory loss' | Medical research | The Guardian.txt",
+    "Pregnancy Brain — Forgetfulness During Pregnancy.txt",
+    "Pregnancy brain- When it starts and what causes pregnancy brain fog | BabyCenter.txt",
+    "Pregnancy does cause memory loss, study says - CNN.txt",
+    "Textbook J.A. Russell, A.J. Douglas, R.J. Windle, C.D. Ingram - The Maternal Brain_ Neurobiological and Neuroendocrine Adaptation and Disorders in Pregnancy & Post Partum-Elsevier Science (2001).txt",
+    "The effect of pregnancy on maternal cognition - PMC.txt",
+    "This Is Your Brain on Motherhood - The New York Times.txt",
+    "Working memory from pregnancy to postpartum.txt",
+    "What Is Mom Brain and Is It Real?.txt",
+    "Memory loss in Pregnancy- Myth or Fact? - International Forum for Wellbeing in Pregnancy.txt",
+    "Memory and mood changes in pregnancy- a qualitative content analysis of women’s first-hand accounts.txt",
+    "Is Mom Brain real? Understanding and coping with postpartum brain fog.txt",
+    "Everyday Life Memory Deficits in Pregnant Women.txt",
+    "Cognitive Function Decline in the Third Trimester.txt",
+    "'Mommy brain' might be a good thing, new research suggests | CBC Radio.txt"
+]
+data = []
+for file_path in txt_files:
+    with open(file_path, "r") as file:
+        text = file.read()
+        data.append({"text": text})
+df = pd.DataFrame(data)
+# Cleaning the text
+nltk.download('punkt')  # Download the 'punkt' tokenizer models for tokenization
+df['tokens'] = df['text'].apply(word_tokenize) # Tokenize each text in the 'text' column into a list of words
+nltk.download('stopwords')  # Download the stopwords corpus for English
+stop_words = set(stopwords.words('english'))  # Load the English stopwords into a set
+df['cleaned_text'] = df['tokens'].apply(lambda x: [word.lower() for word in x if (word.isalnum() and word.lower() not in stop_words)])
+df['cleaned_text'] = df['cleaned_text'].apply(lambda x: ' '.join(x))
+# Streamlit app
+st.title("Memory Support Chatbox for Pregnant Women")
+user_input = st.text_input("You:", "Enter your message here...")
+if user_input:
+    input_ids = tokenizer.encode(user_input, return_tensors='pt')
+    reply_ids = model.generate(input_ids, max_length=100, pad_token_id=tokenizer.eos_token_id)
+    reply_text = tokenizer.decode(reply_ids[0], skip_special_tokens=True)
+    st.text_area("Chatbot:", value=reply_text, height=200)
+# Text Analysis
+st.subheader("Text Analysis")
+# Word Cloud
+st.subheader("Word Cloud")
+all_text = " ".join(df["cleaned_text"])
+wordcloud = WordCloud(width=800, height=400, background_color="white").generate(all_text)
+plt.figure(figsize=(10, 5))
+plt.imshow(wordcloud, interpolation="bilinear")
+plt.axis("off")
+st.pyplot(plt)
+# Sample Prompts
+st.subheader("Sample Prompts")
+sample_prompts = [
+    "What causes pregnancy brain fog?",
+    "How does pregnancy affect the brain?",
+    "How can I improve my memory during pregnancy?",
+    "Can pregnancy brain fog affect my ability to work or perform daily tasks?",
+]
+for prompt in sample_prompts:
+    input_ids = tokenizer.encode(prompt, return_tensors='pt')
+    output = model.generate(input_ids, max_length=100, num_return_sequences=1, pad_token_id=tokenizer.eos_token_id, attention_mask=input_ids.ne(tokenizer.eos_token_id))
+    response = tokenizer.decode(output[0], skip_special_tokens=True)
+    st.write(f"**Prompt:** {prompt}\n**Response:** {response}\n")
+# Displaying DataFrame
+st.subheader("DataFrame")
+st.write(df)