jaimin committed on
Commit
92824c7
1 Parent(s): bcdf874

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -20
app.py CHANGED
@@ -5,32 +5,37 @@ import gradio as gr
5
  import nltk
6
  from nltk.tokenize import word_tokenize
7
  import re
 
8
  nltk.download('punkt')
9
 
10
  model_name = "deepset/roberta-base-squad2"
11
  model = AutoModelForQuestionAnswering.from_pretrained(model_name)
12
  tokenizer = AutoTokenizer.from_pretrained(model_name)
13
 
14
- def bullete(text,wikipedia_language="en"):
15
- try:
16
- question_words = STOPWORDS.union(set(['likes','play','.',',','like',"don't",'?','use','choose','important','better','?']))
17
- lower_text = text.lower()
18
- lower_text = word_tokenize(lower_text)
19
- new_text = [i for i in lower_text if i not in question_words]
20
- new_txt = "".join(new_text)
21
- if wikipedia_language:
22
- wikipedia.set_lang(wikipedia_language)
23
-
24
- et_page = wikipedia.page(new_txt.replace(" ", ""))
25
- title = et_page.title
26
- content = et_page.content
27
- page_url = et_page.url
28
- linked_pages = et_page.links
29
-
30
- text1 = content
 
 
 
 
31
  final_out = re.sub(r'\=.+\=', '', text1)
32
  result = list(filter(lambda x: x != '', final_out.split('\n\n')))
33
-
34
  answer = []
35
  try:
36
  for i in range(len(result[0].split('.'))):
@@ -51,11 +56,12 @@ def bullete(text,wikipedia_language="en"):
51
  final_answer = paraphrase.replace(" ", " ")
52
  return final_answer
53
 
54
- except:
55
- return "Please write correct wikipedia article name OR question"
56
  interface = gr.Interface(fn=bullete,
57
  inputs="text",
58
  outputs="text",
59
  title='Bullet Point')
60
 
61
  interface.launch(inline=False)
 
5
  import nltk
6
  from nltk.tokenize import word_tokenize
7
  import re
8
+
9
  nltk.download('punkt')
10
 
11
  model_name = "deepset/roberta-base-squad2"
12
  model = AutoModelForQuestionAnswering.from_pretrained(model_name)
13
  tokenizer = AutoTokenizer.from_pretrained(model_name)
14
 
15
+
16
+ def bullete(text, wikipedia_language="en"):
17
+ question_words = STOPWORDS.union(
18
+ set(['likes', 'play', '.', ',', 'like', "don't", '?', 'use', 'choose', 'important', 'better', '?']))
19
+ try:
20
+ lower_text = text.lower()
21
+ lower_text = word_tokenize(lower_text)
22
+ new_text = [i for i in lower_text if i not in question_words]
23
+ new_txt = "".join(new_text)
24
+ if wikipedia_language:
25
+ wikipedia.set_lang(wikipedia_language)
26
+
27
+ et_page = wikipedia.page(new_txt.replace(" ", ""))
28
+ title = et_page.title
29
+ content = et_page.content
30
+ page_url = et_page.url
31
+ linked_pages = et_page.links
32
+
33
+ text1 = content
34
+ except:
35
+ return "Please write correct question"
36
  final_out = re.sub(r'\=.+\=', '', text1)
37
  result = list(filter(lambda x: x != '', final_out.split('\n\n')))
38
+
39
  answer = []
40
  try:
41
  for i in range(len(result[0].split('.'))):
56
  final_answer = paraphrase.replace(" ", " ")
57
  return final_answer
58
 
59
+
60
+
61
  interface = gr.Interface(fn=bullete,
62
  inputs="text",
63
  outputs="text",
64
  title='Bullet Point')
65
 
66
  interface.launch(inline=False)
67
+