Spaces:

taishi-i
/

awesome-japanese-nlp-resources-search

Running

App Files Community

taishi-i committed on Mar 25, 2023

Commit

94349ba

•

1 Parent(s): 1fdf118

Update app.py

Browse files

Files changed (1) hide show

app.py +95 -58

app.py CHANGED Viewed

@@ -3,61 +3,98 @@ import json
 import streamlit as st
 from pyserini.search.lucene import LuceneSearcher
-# Search engine
-searcher = LuceneSearcher("indexes/docs")
-searcher.set_language("ja")
-# UI
-st.set_page_config(
-    page_title="awesome-japanese-nlp-resources-search",
-    page_icon="😎",
-    layout="centered",
-)
-cola, colb, colc = st.columns([5, 4, 5])
-st.header("awesome-japanese-nlp-resources-search 😎")
-st.markdown(
-    "You can search for open-source software from [400+ Japanese NLP"
-    " repositories](https://github.com/taishi-i/awesome-japanese-nlp-resources)."
-)
-col1, col2 = st.columns([9, 1])
-with col1:
-    search_query = st.text_input(label="", placeholder="Search")
-with col2:
-    st.write("#")
-    button_clicked = st.button("🔎")
-if search_query or button_clicked:
-    search_results = searcher.search(search_query, k=100_000)
-    st.write(
-        '<p align="light" style="color:grey;">'
-        f" {len(search_results):,.0f} repositories </p>",
-        unsafe_allow_html=True,
-    )
-    for result in search_results:
-        data_json = json.loads(result.raw)
-        description = data_json["description"]
-        url = data_json["url"]
-        project_name = data_json["project_name"]
-        main_topic = data_json["main_topic"]
-        sub_topic = data_json["sub_topic"]
-        try:
-            st.markdown(f"### [{project_name}]({url})")
-            st.markdown(f"{description}")
-            if sub_topic is None:
-                st.text(f"{main_topic}")
-            else:
-                st.text(f"{main_topic} / {sub_topic}")
-            st.markdown("")
-            st.markdown("")
-        except:
-            pass

 import streamlit as st
 from pyserini.search.lucene import LuceneSearcher
+class SearchApplication:
+    def __init__(self):
+        self.title = "Awesome Japanese NLP resources search"
+        self.set_page_config()
+        self.searcher = self.set_searcher()
+        st.header(self.title)
+        col1, col2 = st.columns(2)
+        with col1:
+            self.query = st.text_input(
+                "Search English or Japanese words", value=""
+            )
+        with col2:
+            st.write("#")
+            self.search_button = st.button("🔎")
+        st.caption(
+            "You can search for open-source software from [400+ Japanese NLP"
+            " repositories](https://github.com/taishi-i/awesome-japanese-nlp-resources)."
+        )
+        st.write("#")
+        self.show_popular_words()
+        self.show_search_results()
+    def set_page_config(self):
+        st.set_page_config(
+            page_title=self.title,
+            page_icon="😎",
+            layout="centered",
+        )
+    def set_searcher(self):
+        searcher = LuceneSearcher("indexes/docs")
+        searcher.set_language("ja")
+        return searcher
+    def show_popular_words(self):
+        st.caption("Popular words")
+        word1, word2, word3, word4, _ = st.columns(5)
+        with word1:
+            button1 = st.button("Python")
+            if button1:
+                self.query = "Python"
+        with word2:
+            button2 = st.button("BERT")
+            if button2:
+                self.query = "BERT"
+        with word3:
+            button3 = st.button("辞書")
+            if button3:
+                self.query = "辞書"
+        with word4:
+            button4 = st.button("コーパス")
+            if button4:
+                self.query = "Corpus"
+    def show_search_results(self):
+        if self.query or self.search_button:
+            st.write("#")
+            search_results = self.searcher.search(self.query, k=500)
+            num_search_results = len(search_results)
+            st.write(f"{num_search_results} results")
+            for result in search_results:
+                data_json = json.loads(result.raw)
+                description = data_json["description"]
+                url = data_json["url"]
+                project_name = data_json["project_name"]
+                main_topic = data_json["main_topic"]
+                sub_topic = data_json["sub_topic"]
+                st.subheader(f"[{project_name}]({url})")
+                st.markdown(description)
+                if sub_topic is None:
+                    st.caption(f"{main_topic}")
+                else:
+                    st.caption(f"{main_topic} / {sub_topic}")
+                st.write("#")
+def main():
+    SearchApplication()
+if __name__ == "__main__":
+    main()