Spaces:

spacy
/

healthsea-demo

Runtime error

App Files Community

edichief committed on Nov 29, 2021

Commit

2db6e66

•

1 Parent(s): 40351d8

Add more info and warnings

Browse files

Files changed (3) hide show

app.py +3 -6
visualize_dataset.py +9 -6
visualize_pipeline.py +10 -8

app.py CHANGED Viewed

@@ -15,17 +15,14 @@ intro.subheader("Create easier access to health✨")
 jellyfish.image("data/img/Jellymation.gif")
 intro.markdown(
-    "Healthsea is a spaCy v3 pipeline that analyzes user reviews to supplement products by extracting their effects on health."
 )
 intro.markdown(
-    """With this app, you're able to explore the results of Healthsea on up to 1 million reviews.
-    You can search for any health aspect, whether it's an disease (e.g. joint pain) or a desired health effect such as (e.g. energy),
-    the app returns a list of the best products and substances. You can also explore the pipeline itself, by writing custom reviews and
-    get an insight into the individual proccessing steps.
     """
 )
 intro.markdown(
-    """You can read more in our [blog post]().
     """
 )

 jellyfish.image("data/img/Jellymation.gif")
 intro.markdown(
+    "Healthsea is a spaCy v3 pipeline that analyzes user-generated reviews to supplementary products by extracting the effects on health stated by the reviewer."
 )
 intro.markdown(
+    """With this app, you're able to explore the pipeline and it's result on productive data. You can choose between two different apps `Visualize dataset` and `Visualize pipeline`
     """
 )
 intro.markdown(
+    """The code for Healthsea is provided in this [github repository](https://github.com/thomashacker/healthsea) and if you're interested you can read more about the project in our [blog post]().
     """
 )

visualize_dataset.py CHANGED Viewed

@@ -52,7 +52,10 @@ def visualize_dataset():
     # KPI
-    st.markdown("""This app presents the analyzed dataset of up to one million reviews. You can search for the best products and substances to any health aspect based on what reviewers wrote in their reviews.""")
     st.markdown("""---""")
@@ -70,10 +73,10 @@ def visualize_dataset():
     # Expander
     show_conditions, show_benefits = st.columns(2)
-    with show_conditions.expander("Top 1000 mentioned Conditions"):
         st.write(search_engine.get_all_conditions_df())
-    with show_benefits.expander("Top 1000 mentioned Benefits"):
         st.write(search_engine.get_all_benefits_df())
     st.markdown("""---""")
@@ -85,7 +88,7 @@ def visualize_dataset():
     st.markdown("""---""")
     st.markdown(central_text("🧃 Products"), unsafe_allow_html=True)
-    st.markdown("""The products are scored based on what reviewers say. Additional variables in the scoring function are product rating, helpful count and whether the review is considered 'fake'. """)
     # DataFrame
     st.write(search_engine.get_products_df(search, n))
@@ -115,7 +118,7 @@ def visualize_dataset():
             current_aspect = search_engine.get_aspect_meta(aspect)
             vectors.append((current_aspect["name"], current_aspect["vector"]))
         st.markdown("\n")
-        st.markdown("""To improve the search, the table also shows results of other health aspects with a high similarity""")
         st.write(search_engine.tsne_plot(vectors))
     else:
@@ -133,7 +136,7 @@ def visualize_dataset():
     # Substances
     st.markdown(central_text("🍯 Substances"), unsafe_allow_html=True)
-    st.markdown("""The scores of the substances are based on the products""")
     # DataFrame
     st.write(search_engine.get_substances_df(search, n))

     # KPI
+    st.info("""This app presents the analyzed dataset of up to one million reviews. You can search for the products and substances with the highest score based on health aspect. The score is based on what reviewers wrote in their reviews.""")
+    st.warning("""Please note that the results produced by Healthsea should not be used as a foundation for solving health problems neither do we want to advocate that supplement products are able to solve everyone's health issues.
+    Healthsea is a research project that presents a technical approach on analyzing user-generated reviews and acts as a proof-of-concept.""")
     st.markdown("""---""")
     # Expander
     show_conditions, show_benefits = st.columns(2)
+    with show_conditions.expander("Top mentioned Conditions"):
         st.write(search_engine.get_all_conditions_df())
+    with show_benefits.expander("Top mentioned Benefits"):
         st.write(search_engine.get_all_benefits_df())
     st.markdown("""---""")
     st.markdown("""---""")
     st.markdown(central_text("🧃 Products"), unsafe_allow_html=True)
+    st.info("""The products are scored based on what reviewers say. Additional variables in the scoring function are product rating, helpful count and whether the review is considered 'fake'. """)
     # DataFrame
     st.write(search_engine.get_products_df(search, n))
             current_aspect = search_engine.get_aspect_meta(aspect)
             vectors.append((current_aspect["name"], current_aspect["vector"]))
         st.markdown("\n")
+        st.info("""To improve the search, the table also shows results of other health aspects with a high similarity""")
         st.write(search_engine.tsne_plot(vectors))
     else:
     # Substances
     st.markdown(central_text("🍯 Substances"), unsafe_allow_html=True)
+    st.info("""The scores of the substances are based on the products""")
     # DataFrame
     st.write(search_engine.get_substances_df(search, n))

visualize_pipeline.py CHANGED Viewed

@@ -60,10 +60,10 @@ def visualize_pipeline():
         </div>"""
         return html
-    load_state = st.markdown ("#### Loading...")
     # Load model
     try:
-        load_state.markdown ("#### Loading model...")
         if "model" not in st.session_state:
             nlp = spacy.load("en_healthsea")
             st.session_state["model"] = nlp
@@ -72,15 +72,15 @@ def visualize_pipeline():
     except LookupError:
         import nltk
         import benepar
-        load_state.markdown ("#### Downloading model...")
         benepar.download('benepar_en3')
         if "model" not in st.session_state:
             nlp = spacy.load("en_healthsea")
             st.session_state["model"] = nlp
-    load_state.markdown ("#### Loading done!")
     # Pipeline
-    st.markdown("""This app visualizes the processing steps of the Healthsea pipeline. You can test it by writing an example review.""")
     st.markdown("""---""")
@@ -105,7 +105,7 @@ def visualize_pipeline():
         colors={"CONDITION": "#FF4B76", "BENEFIT": "#629B68"},
     )
-    st.markdown("""The first processing step is to identify Conditions or Benefits with Named Entity Recognition. Conditions are diseases, symptoms and general health problems (e.g. joint pain), while Benefits are positive desired health aspects (e.g. energy)""")
     st.markdown("""---""")
@@ -123,9 +123,11 @@ def visualize_pipeline():
         )
         st.markdown("\n")
-    st.markdown("""The review is segmented into sub-clauses and then classified by a Text Classification model. We additionally blind the found entities to improve generalization and also to inform the model about our current target entity of which we want to get the prediction of.
     The Text Classification predicts four exclusive classes: 'Positive', 'Negative', 'Neutral', 'Anamnesis', they represent the health effect.""")
     st.markdown("""---""")
     # Aggregation
@@ -141,7 +143,7 @@ def visualize_pipeline():
         )
         st.markdown("\n")
-    st.markdown("""Multiple classification are aggregated into one final classification.""")
     st.markdown("""---""")
     # Indepth

         </div>"""
         return html
+    load_state = st.info("Loading...")
     # Load model
     try:
+        load_state.info("Loading model...")
         if "model" not in st.session_state:
             nlp = spacy.load("en_healthsea")
             st.session_state["model"] = nlp
     except LookupError:
         import nltk
         import benepar
+        load_state.info ("Downloading model...")
         benepar.download('benepar_en3')
         if "model" not in st.session_state:
             nlp = spacy.load("en_healthsea")
             st.session_state["model"] = nlp
+    load_state.success ("Loading complete!")
     # Pipeline
+    st.info("""This app visualizes the processing steps of the Healthsea pipeline. You can test it by writing an example review.""")
     st.markdown("""---""")
         colors={"CONDITION": "#FF4B76", "BENEFIT": "#629B68"},
     )
+    st.info("""The first processing step is to identify Conditions or Benefits with Named Entity Recognition. Conditions are diseases, symptoms and general health problems (e.g. joint pain), while Benefits are positive desired health aspects (e.g. energy)""")
     st.markdown("""---""")
         )
         st.markdown("\n")
+    st.info("""The review is segmented into sub-clauses and then classified by a Text Classification model. We additionally blind the found entities to improve generalization and also to inform the model about our current target entity of which we want to get the prediction of.
     The Text Classification predicts four exclusive classes: 'Positive', 'Negative', 'Neutral', 'Anamnesis', they represent the health effect.""")
+    st.info("""The 'Anamnesis' class is defined as the current state of health of a reviewer (e.g. 'I am diagnosed with joint pain'). It is used to link stated health effects that are mentioned in later sentences.""")
     st.markdown("""---""")
     # Aggregation
         )
         st.markdown("\n")
+    st.info("""Multiple classification are aggregated into one final classification.""")
     st.markdown("""---""")
     # Indepth