taishi-i committed on
Commit
650b6f6
•
1 Parent(s): ec98b0b

update app.py

Browse files
app.py CHANGED
@@ -2,37 +2,41 @@ import json
2
 
3
  import gradio as gr
4
  import pandas as pd
5
- from pyserini.search.lucene import LuceneSearcher
6
 
7
- searcher = LuceneSearcher("indexes/docs")
8
- searcher.set_language("ja")
9
 
 
 
 
 
10
 
11
- def show_search_results(query):
12
- search_results = searcher.search(query, k=100)
13
 
14
- data = {"project_name": [], "description": []}
15
- for result in search_results:
16
- docid = result.docid
17
- doc = searcher.doc(docid)
18
- data_json = json.loads(doc.raw())
 
 
 
 
 
 
 
19
 
20
- url = data_json["url"]
21
- description = data_json["description"]
22
- project_name = data_json["project_name"]
23
 
24
- data["project_name"].append(f"[{project_name}]({url})")
25
- data["description"].append(description)
26
 
27
- data = pd.DataFrame(data)
28
- return data
 
 
29
 
30
 
31
  with gr.Blocks() as demo:
32
  gr.Markdown(
33
  """
34
  # Awesome Japanese NLP resources search 🔎
35
- You can search for open-source software from [500+ Japanese NLP repositories](https://github.com/taishi-i/awesome-japanese-nlp-resources).
36
  """
37
  )
38
 
 
2
 
3
  import gradio as gr
4
  import pandas as pd
 
5
 
 
 
6
 
7
+ def read_json(file_name):
8
+ with open(file_name, "r") as f:
9
+ json_data = json.load(f)
10
+ return json_data
11
 
 
 
12
 
13
+ json_file = "awesome-japanese-nlp-resources-search.json"
14
+ json_data = read_json(json_file)
15
+ data = {"project_name": [], "source": [], "description": []}
16
+
17
+ for data_json in json_data:
18
+ url = data_json["url"]
19
+ description = data_json["description"]
20
+ project_name = data_json["project_name"]
21
+ source = data_json["source"]
22
+ data["project_name"].append(f"[{project_name}]({url})")
23
+ data["source"].append(source)
24
+ data["description"].append(description)
25
 
26
+ data = pd.DataFrame(data)
 
 
27
 
 
 
28
 
29
+ def show_search_results(query):
30
+ contained = data["description"].str.contains(query)
31
+ df_search = data[contained]
32
+ return df_search
33
 
34
 
35
  with gr.Blocks() as demo:
36
  gr.Markdown(
37
  """
38
  # Awesome Japanese NLP resources search 🔎
39
+ You can search for open-source software from [1000+ Japanese NLP repositories](https://github.com/taishi-i/awesome-japanese-nlp-resources).
40
  """
41
  )
42
 
awesome-japanese-nlp-resources-search.json ADDED
The diff for this file is too large to render. See raw diff
 
packages.txt DELETED
@@ -1 +0,0 @@
1
- default-jdk
 
 
requirements.txt CHANGED
@@ -1,4 +1 @@
1
- pyserini
2
- faiss-cpu
3
- torch
4
- altair<5
 
1
+ pandas