Spaces:

agenticx
/

TxAgentRAOEval

Sleeping

App Files Files Community

shgao committed on Jun 3

Commit

0433ab9

1 Parent(s): 2e80564

update

Browse files

Files changed (1) hide show

app.py +11 -11

app.py CHANGED Viewed

@@ -515,6 +515,7 @@ def go_to_eval_progress_modal(name, email, evaluator_id, specialty_dd, subspecia
     # Map advance_workflow outputs to the required return format
     # advance_workflow already guarantees that the returned list has the correct length, so no extra check is needed
     return (
             gr.update(visible=False),                                   # page0
             ui_updates.get('page1_visible', gr.update(visible=False)),  # page1
@@ -525,7 +526,7 @@ def go_to_eval_progress_modal(name, email, evaluator_id, specialty_dd, subspecia
             ui_updates.get('page2_prompt', ""),                         # page2_prompt
             data_subset_state['reference_answer'],        # page1_reference_answer
             data_subset_state['reference_answer'],        # page2_reference_answer
-            f"You are about to evaluate the next question. You have {remaining_count} question(s) remaining to evaluate.",  # eval_progress_text
             user_info,                                                  # user_info_state
             data_subset_state,                                          # data_subset_state
             ui_updates.get('progress_state', progress_state),           # progress_state
@@ -1310,14 +1311,14 @@ def advance_workflow(progress_state, data_subset_state, current_pairwise=None, c
             'progress_state': progress_state,
             'page1_visible': gr.update(visible=True),  # Keep page1 visible
             'page2_visible': gr.update(visible=False),  # Hide page2
-            'pairwise_radios': [gr.update() for _ in range(criteria_for_comparison)],
             'pairwise_reasons': [gr.update() for _ in range(len_criteria)],
             'chat_a_page1': gr.update(), # Keep chat_a unchanged
             'chat_b_page1': gr.update(), # Keep chat_b unchanged
             'page1_prompt': gr.update(), # Keep page1_prompt unchanged
             'chat_a_page2': gr.update(),  # Keep chat_a_page2 unchanged
             'chat_b_page2': gr.update(),  # Keep chat_b_page2 unchanged
-            'page2_prompt': gr.update(),  # Keep chat_b_page2 unchanged
             'pairwise_results_for_display': default_pairwise_results
         }
@@ -1685,7 +1686,8 @@ def submit_pairwise_scoring(progress_state, data_subset_state, user_info, *ratin
     # Use advance_workflow to get all UI updates
     ui_updates = advance_workflow(progress_state, data_subset_state)
     print(f"\033[93mIn submit_pairwise_scoring, using advance_workflow results: mode={progress_state.get('mode')}\033[0m")
-    gr.Info(f"You are about to evaluate the next question. You have {remaining_count} question(s) remaining to evaluate.")  # eval_progress_text
     return (
             ui_updates.get('page1_visible'),                           # 5
             ui_updates.get('page2_visible'),                           # 6
@@ -1949,9 +1951,7 @@ with gr.Blocks(css=centered_col_css) as demo:
         - If you wish to evaluate multiple questions, you may do so; you will never be asked to re-evaluate questions you have already seen.
         - When evaluating a question, you will be asked to compare the responses of two different models to the question and then rate each model's response on a scale of 1-5.
         - If you feel that a question does not make sense or is not biomedically relevant, there is a RED BUTTON at the top of the first model comparison page to indicate this
-        - You may use the Back and Next buttons at the bottom of each page to edit any of your responses before submitting.
-        - You may use the Home Page button at the bottom of each page to the home page. Your progress will be saved but not submitted.
-        - You must submit your answers to the current question before moving on to evaluate the next question.
         - You may stop in between questions and return at a later time; however, you must submit your answers to the current question if you would like them saved.
         - Please review the example question and LLM model response below:
@@ -2114,12 +2114,12 @@ with gr.Blocks(css=centered_col_css) as demo:
         page1_error_box = gr.Markdown("")  # ADDED: display validation errors
         with gr.Row():
             # back_btn_0 = gr.Button("Back")
-            next_btn_1 = gr.Button("Next: Rate Responses")
         with gr.Row():
             # ADDED: Home button on page11
             home_btn_1 = gr.Button(
-                "Home Page (your progress on this question will be saved but not submitted)")
     # Page 2: Combined Rating Page for both responses.
     with gr.Column(visible=False) as page2:
@@ -2214,11 +2214,11 @@ with gr.Blocks(css=centered_col_css) as demo:
         with gr.Row():
             # back_btn_2 = gr.Button("Back")
             submit_btn = gr.Button(
-                "Submit (Note: Once submitted, you cannot edit your responses)", elem_id="submit_btn")
         with gr.Row():
             home_btn_2 = gr.Button(
-                "Home Page (your progress on this question will be saved but not submitted)")
         result_text = gr.Textbox(label="Validation Result")

     # Map advance_workflow outputs to the required return format
     # advance_workflow already guarantees that the returned list has the correct length, so no extra check is needed
+    num_remaining_questions = remaining_count// len(progress_state['all_pairs'])
     return (
             gr.update(visible=False),                                   # page0
             ui_updates.get('page1_visible', gr.update(visible=False)),  # page1
             ui_updates.get('page2_prompt', ""),                         # page2_prompt
             data_subset_state['reference_answer'],        # page1_reference_answer
             data_subset_state['reference_answer'],        # page2_reference_answer
+            f"You are about to evaluate the next question. You have {num_remaining_questions} question(s) remaining to evaluate.",  # eval_progress_text
             user_info,                                                  # user_info_state
             data_subset_state,                                          # data_subset_state
             ui_updates.get('progress_state', progress_state),           # progress_state
             'progress_state': progress_state,
             'page1_visible': gr.update(visible=True),  # Keep page1 visible
             'page2_visible': gr.update(visible=False),  # Hide page2
+            'pairwise_radios': [gr.update() for _ in range(len_criteria)],
             'pairwise_reasons': [gr.update() for _ in range(len_criteria)],
             'chat_a_page1': gr.update(), # Keep chat_a unchanged
             'chat_b_page1': gr.update(), # Keep chat_b unchanged
             'page1_prompt': gr.update(), # Keep page1_prompt unchanged
             'chat_a_page2': gr.update(),  # Keep chat_a_page2 unchanged
             'chat_b_page2': gr.update(),  # Keep chat_b_page2 unchanged
+            'page2_prompt': gr.update(),  # Keep page2_prompt unchanged
             'pairwise_results_for_display': default_pairwise_results
         }
     # Use advance_workflow to get all UI updates
     ui_updates = advance_workflow(progress_state, data_subset_state)
     print(f"\033[93mIn submit_pairwise_scoring, using advance_workflow results: mode={progress_state.get('mode')}\033[0m")
+    num_remaining_questions = remaining_count// len(progress_state['all_pairs'])
+    gr.Info(f"You are about to evaluate the next question. You have {num_remaining_questions} question(s) remaining to evaluate.")  # eval_progress_text
     return (
             ui_updates.get('page1_visible'),                           # 5
             ui_updates.get('page2_visible'),                           # 6
         - If you wish to evaluate multiple questions, you may do so; you will never be asked to re-evaluate questions you have already seen.
         - When evaluating a question, you will be asked to compare the responses of two different models to the question and then rate each model's response on a scale of 1-5.
         - If you feel that a question does not make sense or is not biomedically relevant, there is a RED BUTTON at the top of the first model comparison page to indicate this
+        - You may use the Next buttons at the bottom of each page to submit your current response and go to the next question.
         - You may stop in between questions and return at a later time; however, you must submit your answers to the current question if you would like them saved.
         - Please review the example question and LLM model response below:
         page1_error_box = gr.Markdown("")  # ADDED: display validation errors
         with gr.Row():
             # back_btn_0 = gr.Button("Back")
+            next_btn_1 = gr.Button("Submit & Next One (Once submitted, you cannot edit your responses)",)
         with gr.Row():
             # ADDED: Home button on page11
             home_btn_1 = gr.Button(
+                "Home Page")
     # Page 2: Combined Rating Page for both responses.
     with gr.Column(visible=False) as page2:
         with gr.Row():
             # back_btn_2 = gr.Button("Back")
             submit_btn = gr.Button(
+                "Submit & Next One (Once submitted, you cannot edit your responses)", elem_id="submit_btn")
         with gr.Row():
             home_btn_2 = gr.Button(
+                "Home Page")
         result_text = gr.Textbox(label="Validation Result")