Spaces:

DeepJudge
/

Applicant-Task-Submission

Running

App Files Files

Timothy-Vinzent committed on Feb 19

Commit

c1cd0b6

verified ·

1 Parent(s): 3f8b483

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -3

app.py CHANGED Viewed

@@ -22,7 +22,7 @@ def get_evaluation_questions():
     Both lists must be of equal length.
     """
     questions_str = os.environ.get("TEST_QUESTION_1")
-    expected_str = os.environ.get("TEST_EXPECTED")
     if not questions_str or not expected_str:
         return []
     try:
@@ -126,10 +126,34 @@ def build_interface():
     Constructs the Gradio interface with a submission button and single-submission mechanism.
     """
     with gr.Blocks() as demo:
-        gr.Markdown("# GPT-4o Mini Prompt Submission")
         gr.Markdown(
             "Please enter your details and submit your system prompt below. "
-            "You can only submit once."
         )
         email_input = gr.Textbox(label="Email", placeholder="your.email@example.com")

     Both lists must be of equal length.
     """
     questions_str = os.environ.get("TEST_QUESTION_1")
+    expected_str = os.environ.get("TEST_EXPECTED_1")
     if not questions_str or not expected_str:
         return []
     try:
     Constructs the Gradio interface with a submission button and single-submission mechanism.
     """
     with gr.Blocks() as demo:
+        gr.Markdown("# GPT-4o Mini System Prompt Submission")
+        gr.Markdown("""Classification Task: Document and Clause Level Identification
+                    Challenge Description
+                    Participants must create a system prompt for a language model that classifies user queries about legal documents into two specific categories:"
+                    1. Document Level: Determines whether the query refers to a single document or multiple documents.
+                    2. Clause Level: Identifies whether the query is focused on:
+                        - A single clause,
+                        - Multiple clauses, or
+                        - General information not constrained to any specific clause.
+                    The model must return a valid JSON object with the following structure:
+                    json```
+                    {
+                      "document_level": "single/multiple",
+                      "clause_level": "single/multiple/general"
+                    }```
+                    The goal is to ensure that the model's output is concise, structured, and accurate. This task is designed to evaluate the robustness of the system prompt in handling classification tasks with short, precise outputs.
+                    """)
         gr.Markdown(
             "Please enter your details and submit your system prompt below. "
+            "You can only submit once, I suggest trying to test and build out the system prompt using the same LM being used here elsewhere before submitting."
         )
         email_input = gr.Textbox(label="Email", placeholder="your.email@example.com")