oliverwang15 committed on
Commit
9ad1d3a
1 Parent(s): 9ec1c48

Change outlook and add hard questions

Browse files
app.py CHANGED
@@ -14,6 +14,12 @@ QUESTIONS = [
14
  "Intervention 1",
15
  "Intervention 2",
16
  "Genetic Chain",
 
 
 
 
 
 
17
  ]
18
 
19
  with gr.Blocks(theme="dark") as demo:
@@ -23,31 +29,40 @@ with gr.Blocks(theme="dark") as demo:
23
  <center> <h4> Please follow the Instruction <a href="https://huggingface.co/spaces/oliverwang15/DAN_AI/blob/main/README.md">HERE</a> </h4> </center>')
24
 
25
  with gr.Row():
 
 
 
 
 
26
  with gr.Row():
27
-
28
- # Update
29
  with gr.Group():
30
- gr.Markdown(f'<center><h1>Input</h1></center>')
31
- gr.Markdown(f'<center><p>Please First Upload the File</p></center>')
32
-
33
- with gr.Group():
34
- gr.Markdown(f'<center><h2>Request Online</h2></center>')
35
- openai_key = gr.Textbox(
36
- label='Enter your OpenAI API key here',
37
- type='password')
38
-
39
- model_selection = gr.Radio(choices = ["ChatGPT", "GPT4"], label="Model Selection", info="Please select the model you want to use")
 
 
 
 
 
 
 
 
 
 
 
40
 
41
- file = gr.File(label='Upload your .txt or .pdf file here', file_types=['.txt', '.pdf'], file_count = 'multiple')
42
- btn_submit_txt_online = gr.Button(value='Submit')
43
- # btn_submit_txt.style(full_width=True)
44
 
45
- with gr.Group():
46
- gr.Markdown(f'<center><h2>Or Load Offline</h2></center>')
47
- questions = gr.CheckboxGroup(choices = QUESTIONS, value = QUESTIONS, label="Questions (Please don't change this part now)", info="Please select the question you want to ask")
48
- answer_type = gr.Radio(choices = ["ChatGPT_txt", "GPT4_txt", 'New_GPT_4_pdf', 'Exp_training', 'Exp_Group_A', 'Exp_Group_B'], label="Answer_type", info="Please select the type of answer you want to show")
49
- btn_submit_txt_offline = gr.Button(value='Show Answers')
50
- # btn_submit_txt.style(full_width=True)
51
 
52
  # Output
53
  with gr.Group():
 
14
  "Intervention 1",
15
  "Intervention 2",
16
  "Genetic Chain",
17
+ "Issues or Challenge Resolved",
18
+ "Innovations in Methodology",
19
+ "Impact of Findings",
20
+ "limitations",
21
+ "Potential Applications",
22
+
23
  ]
24
 
25
  with gr.Blocks(theme="dark") as demo:
 
29
  <center> <h4> Please follow the Instruction <a href="https://huggingface.co/spaces/oliverwang15/DAN_AI/blob/main/README.md">HERE</a> </h4> </center>')
30
 
31
  with gr.Row():
32
+ # Update
33
+ # with gr.Group():
34
+ # gr.Markdown(f'<center><h1>Input</h1></center>')
35
+
36
+
37
  with gr.Row():
38
+ # Online
 
39
  with gr.Group():
40
+ gr.Markdown(f'<center><h2>Request Online</h2></center>')
41
+ # gr.Markdown(f'<center><p>Please First Upload the File</p></center>')
42
+ with gr.Row():
43
+ with gr.Group():
44
+ openai_key = gr.Textbox(
45
+ label='Enter your OpenAI API key here',
46
+ type='password')
47
+ with gr.Group():
48
+ model_selection = gr.Radio(choices = ["ChatGPT", "GPT4"], label="Model Selection", info="Please select the model you want to use")
49
+
50
+ file = gr.File(label='Upload your .txt or .pdf file here', file_types=['.txt', '.pdf'], file_count = 'multiple')
51
+ btn_submit_txt_online = gr.Button(value='Submit')
52
+ # btn_submit_txt.style(full_width=True)
53
+
54
+ # Offline
55
+ with gr.Group():
56
+ gr.Markdown(f'<center><h2>Or Load Offline</h2></center>')
57
+ questions = gr.CheckboxGroup(choices = QUESTIONS, value = QUESTIONS[:6], label="Questions (Please don't change this part now)", info="Please select the question you want to ask")
58
+ answer_type = gr.Radio(choices = ["ChatGPT_txt", "GPT4_txt", 'New_GPT_4_pdf', 'Exp_training', 'Exp_Group_A', 'Exp_Group_B'], label="Answer_type", info="Please select the type of answer you want to show")
59
+ btn_submit_txt_offline = gr.Button(value='Show Answers')
60
+ # btn_submit_txt.style(full_width=True)
61
 
 
 
 
62
 
63
+ with gr.Row():
64
+ with gr.Row():
65
+
 
 
 
66
 
67
  # Output
68
  with gr.Group():
backend.py CHANGED
@@ -8,6 +8,34 @@ import pandas as pd
8
  import os,json
9
  import time
10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  class Backend:
12
  def __init__(self):
13
  self.agent = OpenAI()
@@ -184,7 +212,8 @@ class Backend:
184
  # self.current_question -= 1
185
  return "No more questions!", "No more questions!", "No more questions!", "No more questions!", "No more questions!", 'No more questions!', 'No more questions!', 'Still need to click the button above to save the results', None, None
186
  else:
187
- res = self.gpt_result[f'Question {self.current_question + 1}']
 
188
  question = self.questions[self.current_question]
189
  self.answer = res['answer']
190
  self.highlighted_out = res['original sentences']
@@ -208,7 +237,8 @@ class Backend:
208
  # self.current_question += 1
209
  return "No more questions!", "No more questions!", "No more questions!", "No more questions!", "No more questions!", 'No more questions!', 'No more questions!', 'Still need to click the button above to save the results', None, None
210
  else:
211
- res = self.gpt_result[f'Question {self.current_question + 1}']
 
212
  question = self.questions[self.current_question]
213
  self.answer = res['answer']
214
  self.highlighted_out = res['original sentences']
@@ -318,43 +348,96 @@ class Backend:
318
  else:
319
  return "No answer yet, you need to submit the document first"
320
 
321
- def phase_df(self, df):
322
  df = json.loads(df.T.to_json())
323
  res_list = []
324
  for key, item in df.items():
325
  tmp_res_list = {}
326
 
327
- tep_res_list_q1 = {
328
- 'answer': item['Question 1'],
329
- 'original sentences': eval(item['Question 1_original_sentences']),
330
- }
331
- tep_res_list_q2 = {
332
- 'answer': item['Question 2'],
333
- 'original sentences': eval(item['Question 2_original_sentences']),
334
- }
335
- tep_res_list_q3 = {
336
- 'answer': item['Question 3'],
337
- 'original sentences': eval(item['Question 3_original_sentences']),
338
- }
339
- tep_res_list_q4 = {
340
- 'answer': item['intervention_1'],
341
- 'original sentences': eval(item['Question 4intervention_1_original_sentences']),
342
- }
343
- tep_res_list_q5 = {
344
- 'answer': item['intervention_2'],
345
- 'original sentences': eval(item['Question 4intervention_2_original_sentences']),
346
- }
347
- tep_res_list_q6 = {
348
- 'answer': item['Question 5'],
349
- 'original sentences': eval(item['Question 5_original_sentences']),
350
- }
351
- tmp_res_list['Question 1'] = tep_res_list_q1
352
- tmp_res_list['Question 2'] = tep_res_list_q2
353
- tmp_res_list['Question 3'] = tep_res_list_q3
354
- tmp_res_list['Question 4'] = tep_res_list_q4
355
- tmp_res_list['Question 5'] = tep_res_list_q5
356
- tmp_res_list['Question 6'] = tep_res_list_q6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
357
  res_list.append(tmp_res_list)
 
 
 
 
 
 
358
  return res_list
359
 
360
  def process_file_offline(self, questions, answer_type, progress = gr.Progress()):
@@ -377,7 +460,7 @@ class Backend:
377
  df = pd.read_csv('./offline_results/exp_gb.csv')
378
 
379
  # make the prompt
380
- self.res_list = self.phase_df(df)
381
 
382
  if answer_type in ['ChatGPT_txt', 'GPT4_txt', 'New_GPT_4_pdf']:
383
  if answer_type == 'ChatGPT_txt' or answer_type == 'GPT4_txt':
@@ -403,6 +486,8 @@ class Backend:
403
 
404
  elif answer_type in ['Exp_training', 'Exp_Group_A', 'Exp_Group_B']:
405
  self.filename_list = df['fn'].tolist()
 
 
406
  self.text_list = df['content'].tolist()
407
 
408
 
 
8
  import os,json
9
  import time
10
 
11
+ QUESTION_DICT = {
12
+ "Question 1": "Animal Type",
13
+ "Question 2": "Exposure Age",
14
+ "Question 3": "Behavior Test",
15
+ "intervention_1": "Intervention 1",
16
+ "intervention_2": "Intervention 2",
17
+ "Question 5": "Genetic Chain",
18
+ "Question 6": "Issues or Challenge Resolved",
19
+ "Question 7": "Innovations in Methodology",
20
+ "Question 8": "Impact of Findings",
21
+ "Question 9": "limitations",
22
+ "Question 10": "Potential Applications",
23
+ }
24
+
25
+ REVERSE_QUESTION_DICT = {
26
+ "Animal Type": "Question 1",
27
+ "Exposure Age": "Question 2",
28
+ "Behavior Test": "Question 3",
29
+ "Intervention 1": "Question 4",
30
+ "Intervention 2": "Question 5",
31
+ "Genetic Chain": "Question 6",
32
+ "Issues or Challenge Resolved": "Question 7",
33
+ "Innovations in Methodology": "Question 8",
34
+ "Impact of Findings": "Question 9",
35
+ "limitations": "Question 10",
36
+ "Potential Applications": "Question 11",
37
+ }
38
+
39
  class Backend:
40
  def __init__(self):
41
  self.agent = OpenAI()
 
212
  # self.current_question -= 1
213
  return "No more questions!", "No more questions!", "No more questions!", "No more questions!", "No more questions!", 'No more questions!', 'No more questions!', 'Still need to click the button above to save the results', None, None
214
  else:
215
+ # res = self.gpt_result[f'Question {self.current_question + 1}']
216
+ res = self.gpt_result[list(self.gpt_result.keys())[self.current_question]]
217
  question = self.questions[self.current_question]
218
  self.answer = res['answer']
219
  self.highlighted_out = res['original sentences']
 
237
  # self.current_question += 1
238
  return "No more questions!", "No more questions!", "No more questions!", "No more questions!", "No more questions!", 'No more questions!', 'No more questions!', 'Still need to click the button above to save the results', None, None
239
  else:
240
+ # res = self.gpt_result[f'Question {self.current_question + 1}']
241
+ res = self.gpt_result[list(self.gpt_result.keys())[self.current_question]]
242
  question = self.questions[self.current_question]
243
  self.answer = res['answer']
244
  self.highlighted_out = res['original sentences']
 
348
  else:
349
  return "No answer yet, you need to submit the document first"
350
 
351
+ def phase_df(self, df, questions):
352
  df = json.loads(df.T.to_json())
353
  res_list = []
354
  for key, item in df.items():
355
  tmp_res_list = {}
356
 
357
+ if 'Question 1' in item and "Animal Type" in questions:
358
+ tep_res_list_q1 = {
359
+ 'answer': item['Question 1'],
360
+ 'original sentences': eval(item['Question 1_original_sentences']),
361
+ }
362
+ tmp_res_list['Question 1'] = tep_res_list_q1
363
+
364
+ if 'Question 2' in item and 'Exposure Age' in questions:
365
+ tep_res_list_q2 = {
366
+ 'answer': item['Question 2'],
367
+ 'original sentences': eval(item['Question 2_original_sentences']),
368
+ }
369
+ tmp_res_list['Question 2'] = tep_res_list_q2
370
+
371
+ if 'Question 3' in item and 'Behavior Test' in questions:
372
+ tep_res_list_q3 = {
373
+ 'answer': item['Question 3'],
374
+ 'original sentences': eval(item['Question 3_original_sentences']),
375
+ }
376
+ tmp_res_list['Question 3'] = tep_res_list_q3
377
+
378
+ if 'intervention_1' in item and "Intervention 1" in questions:
379
+ tep_res_list_q4 = {
380
+ 'answer': item['intervention_1'],
381
+ 'original sentences': eval(item['Question 4intervention_1_original_sentences']),
382
+ }
383
+ tmp_res_list['Question 4'] = tep_res_list_q4
384
+
385
+ if 'intervention_2' in item and "Intervention 2" in questions:
386
+ tep_res_list_q5 = {
387
+ 'answer': item['intervention_2'],
388
+ 'original sentences': eval(item['Question 4intervention_2_original_sentences']),
389
+ }
390
+ tmp_res_list['Question 5'] = tep_res_list_q5
391
+
392
+ if 'Question 5' in item and "Genetic Chain" in questions:
393
+ tep_res_list_q6 = {
394
+ 'answer': item['Question 5'],
395
+ 'original sentences': eval(item['Question 5_original_sentences']),
396
+ }
397
+ tmp_res_list['Question 6'] = tep_res_list_q6
398
+
399
+ if 'Question 6' in item and "Issues or Challenge Resolved" in questions:
400
+ tep_res_list_q7 = {
401
+ 'answer': item['Question 6'],
402
+ 'original sentences': eval(item['Question 6_original_sentences']),
403
+ }
404
+ tmp_res_list['Question 7'] = tep_res_list_q7
405
+
406
+ if 'Question 7' in item and "Innovations in Methodology" in questions:
407
+ tep_res_list_q8 = {
408
+ 'answer': item['Question 7'],
409
+ 'original sentences': eval(item['Question 7_original_sentences']),
410
+ }
411
+ tmp_res_list['Question 8'] = tep_res_list_q8
412
+
413
+ if 'Question 8' in item and "Impact of Findings" in questions:
414
+ tep_res_list_q9 = {
415
+ 'answer': item['Question 8'],
416
+ 'original sentences': eval(item['Question 8_original_sentences']),
417
+ }
418
+ tmp_res_list['Question 9'] = tep_res_list_q9
419
+
420
+ if 'Question 9' in item and "limitations" in questions:
421
+ tep_res_list_q10 = {
422
+ 'answer': item['Question 9'],
423
+ 'original sentences': eval(item['Question 9_original_sentences']),
424
+ }
425
+ tmp_res_list['Question 10'] = tep_res_list_q10
426
+
427
+ if 'Question 10' in item and "Potential Applications" in questions:
428
+ tep_res_list_q11 = {
429
+ 'answer': item['Question 10'],
430
+ 'original sentences': eval(item['Question 10_original_sentences']),
431
+ }
432
+ tmp_res_list['Question 11'] = tep_res_list_q11
433
+
434
  res_list.append(tmp_res_list)
435
+
436
+ # checking
437
+ for i in questions:
438
+ if REVERSE_QUESTION_DICT[i] not in tmp_res_list:
439
+ raise gr.Error(f"Question {i} is not in the answer list, Please don't select it!")
440
+
441
  return res_list
442
 
443
  def process_file_offline(self, questions, answer_type, progress = gr.Progress()):
 
460
  df = pd.read_csv('./offline_results/exp_gb.csv')
461
 
462
  # make the prompt
463
+ self.res_list = self.phase_df(df, questions)
464
 
465
  if answer_type in ['ChatGPT_txt', 'GPT4_txt', 'New_GPT_4_pdf']:
466
  if answer_type == 'ChatGPT_txt' or answer_type == 'GPT4_txt':
 
486
 
487
  elif answer_type in ['Exp_training', 'Exp_Group_A', 'Exp_Group_B']:
488
  self.filename_list = df['fn'].tolist()
489
+ if "Passage" not in self.filename_list[0]:
490
+ self.filename_list = [f"[ Passage {i + 1}/{len(self.filename_list)} ] {self.filename_list[i]}" for i in range(len(self.filename_list))]
491
  self.text_list = df['content'].tolist()
492
 
493
 
offline_results/exp_ga.csv CHANGED
The diff for this file is too large to render. See raw diff
 
offline_results/exp_ga_old.csv ADDED
The diff for this file is too large to render. See raw diff
 
offline_results/exp_gb.csv CHANGED
The diff for this file is too large to render. See raw diff
 
offline_results/exp_gb_old.csv ADDED
The diff for this file is too large to render. See raw diff