Spaces:

hamza50
/

paris-hotel-finder

Sleeping

hamza50 committed on Jan 27

Commit

a1c7ed3

•

1 Parent(s): 0bda70d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,17 +6,16 @@
 @author: Hamza Farooq
 """
-import spacy
-from spacy.lang.en.stop_words import STOP_WORDS
 from string import punctuation
 from collections import Counter
 from heapq import nlargest
 import os
-nlp = spacy.load("en_core_web_sm")
 from sentence_transformers import SentenceTransformer, CrossEncoder, util
 import datetime
-from spacy import displacy
 import streamlit as st
 import matplotlib.pyplot as plt
 from wordcloud import WordCloud
@@ -180,18 +179,18 @@ def main():
         for token in text.lower().split():
             token = token.strip(string.punctuation)
-            if len(token) > 0 and token not in _stop_words.ENGLISH_STOP_WORDS:
                 tokenized_doc.append(token)
         return tokenized_doc
     def search(query):
         # q = [str(userinput)]
-        doc = nlp(str(userinput))
-        ent_html = displacy.render(doc, style="ent", jupyter=False)
 # Display the entity visualization in the browser:
-        st.markdown(ent_html, unsafe_allow_html=True)
         ##### BM25 search (lexical search) #####
         bm25_scores = bm25.get_scores(bm25_tokenizer(query))
         top_n = np.argpartition(bm25_scores, -5)[-5:]

 @author: Hamza Farooq
 """
 from string import punctuation
 from collections import Counter
 from heapq import nlargest
 import os
 from sentence_transformers import SentenceTransformer, CrossEncoder, util
 import datetime
 import streamlit as st
 import matplotlib.pyplot as plt
 from wordcloud import WordCloud
         for token in text.lower().split():
             token = token.strip(string.punctuation)
+            if len(token) > 0:
                 tokenized_doc.append(token)
         return tokenized_doc
     def search(query):
         # q = [str(userinput)]
+        # doc = nlp(str(userinput))
+        # ent_html = displacy.render(doc, style="ent", jupyter=False)
 # Display the entity visualization in the browser:
+        st.markdown(query, unsafe_allow_html=True)
         ##### BM25 search (lexical search) #####
         bm25_scores = bm25.get_scores(bm25_tokenizer(query))
         top_n = np.argpartition(bm25_scores, -5)[-5:]