madoss committed on
Commit
2014880
1 Parent(s): 7fc6e0e

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +43 -0
app.py ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import os
3
+ import query_index
4
+ import datasets
5
+ import sentence_transformers
6
+
7
# Process-wide cache so the model, dataset and FAISS index are loaded once
# instead of on every request.
_RESOURCES = {}


def _load_resources():
    """Return the (model, dataset) pair, loading both on first use."""
    if not _RESOURCES:
        model = sentence_transformers.SentenceTransformer(
            "dangvantuan/sentence-camembert-large", device="cpu")
        dataset = datasets.load_dataset(
            "json", data_files=["./data/dataset.json"], split="train")
        # Attach the prebuilt FAISS index under the name used for lookups below.
        dataset.load_faiss_index("embeddings", "index.faiss")
        _RESOURCES["model"] = model
        _RESOURCES["dataset"] = dataset
    return _RESOURCES["model"], _RESOURCES["dataset"]


def query(text: str, k: int = 5) -> str:
    """Return the k dataset entries nearest to *text*, formatted as plain text.

    The query is embedded with the sentence-transformers model and looked up
    in the "embeddings" FAISS index of the dataset. Each hit is rendered from
    its "title", "start", "end", "text" and "url" columns.

    Args:
        text: Free-form query string.
        k: Number of nearest examples to retrieve.

    Returns:
        One four-line section per hit (title, transcript, link, separator),
        joined with newlines. Empty string when nothing is retrieved.
    """
    model, dataset = _load_resources()

    query_embedding = model.encode(text)
    _, retrieved_examples = dataset.get_nearest_examples(
        "embeddings",
        query_embedding,
        k=k,
    )

    lines = []
    # `passage` (not `text`) so the query parameter is not shadowed.
    for passage, start, end, title, url in zip(
        retrieved_examples["text"],
        retrieved_examples["start"],
        retrieved_examples["end"],
        retrieved_examples["title"],
        retrieved_examples["url"],
    ):
        lines.append(f"title: {title}")
        lines.append(f"transcript: [{start} ====> {end}] {passage}")
        lines.append(f"link: {url}")
        lines.append("*" * 10)

    report = "\n".join(lines)
    if report:
        # Keep the stdout log the original produced.
        print(report)
    # The UI displays the function's return value, so the text must be returned.
    return report
35
+
36
# Sample query offered in the UI (one row per example, one cell per input).
_EXAMPLE_QUERIES = [["Qu'est ce qui t'a fait le plus progresser?"]]

# Wire `query` to a single text input and a single text output.
iface = gr.Interface(
    fn=query,
    inputs="text",
    outputs="text",
    examples=_EXAMPLE_QUERIES,
)

# Start serving the interface.
iface.launch()