Spaces:

loveblairsky
/

LLM-model-cards

Sleeping

App Files Files Community

Blair Yang committed on Feb 19

Commit

de1d92a

•

1 Parent(s): 07a63f0

Bugs?

Browse files

Files changed (2) hide show

__pycache__/Sample.cpython-311.pyc +0 -0
app.py +40 -45

__pycache__/Sample.cpython-311.pyc CHANGED Viewed

Binary files a/__pycache__/Sample.cpython-311.pyc and b/__pycache__/Sample.cpython-311.pyc differ

app.py CHANGED Viewed

@@ -1,60 +1,55 @@
 import gradio as gr
-from Sample import *
-display_dict, info_dict = sample_random_entry(n=1)
-# Extract the question text
-question_text = display_dict['qa']
-def markdown_to_html(markdown_text):
-    # You would use a Markdown library to convert markdown to HTML here
-    # Since this code runs in an environment without extra libraries, this is a placeholder
-    html = markdown_text.replace("\n", "<br>")  # Simple replacement, not a real markdown conversion
-    return html
-completion_text = ''
-def evaluate_guess(reasoning, correctness, confidence):
-    # Placeholder for comparison logic
-    # You'll need to access the correct answer from `info_dict` or a similar structure
-    correct_answer = "Correctly"  # Placeholder for the actual logic to determine this
     evaluation_response = "Correct" if correctness == correct_answer else "Incorrect"
-    actual_model = info_dict['model']
-    actual_completion = info_dict['completion']
-    # Update the completion text
-    completion_text = f"Completion: {actual_completion}\n\nChoice: {chr(info_dict['verdict'] + 65)}"
-    model = actual_model
-    # Return the evaluation response and the completion text to update the interface
-    return evaluation_response, model, completion_text
-print(display_dict['card'])
 with gr.Blocks() as app:
     with gr.Row():
-        with gr.Column(scale=2):  # This column is wider
-            # Use a Textbox to display the evaluation card content
-            evaluation_card = gr.Textbox(value=display_dict['card'], label="Evaluation Card", interactive=False)
-            model = gr.Textbox(value="", label="Model", placeholder='An anonymous Model', interactive=False)
-            completion = gr.Textbox(value="", label="Model's Completion", interactive=False)
         with gr.Column(scale=1):
-            # Display the sampled question in a Textbox
             question = gr.Textbox(value=question_text, label="Question", interactive=False)
             reasoning = gr.Textbox(lines=5, placeholder="Your reasoning (optional)")
             correctness = gr.Radio(choices=["Correct", "Incorrect"], label="I believe the model will answer this question")
             confidence = gr.Slider(minimum=0, maximum=10, step=1, label="Confidence")
-            output_text = gr.Text(label="Evaluation Output")  # Create an output text component
             submit_button = gr.Button("Submit")
-            # This textbox will be used to display the model's completion
-    # When the button is clicked, it will update the content of the completion textbox
-    submit_button.click(fn=evaluate_guess, inputs=[reasoning, correctness, confidence], outputs=[output_text, model, completion])
-app.launch()

 import gradio as gr
+from Sample import sample_random_entry
+from Config import TOPICS
+info_dict = {}
+def sample_and_display(topic):
+    # If a topic is selected, use it to sample a new entry
+    global info_dict
+    display_dict, info_dict = sample_random_entry(topic=topic) if topic else sample_random_entry()
+    question_text = display_dict['qa']
+    evaluation_card_text = display_dict['card']
+    model_name = ''  # Clear the model name
+    completion_text = ''  # Clear the completion text
+    return question_text, evaluation_card_text, model_name, completion_text
+def evaluate_guess(reasoning, correctness, confidence, topic):
+    global info_dict
+    # TODO: implement the real logic for evaluating the guess.
+    # Placeholder answer: "Correctly" is not one of the Radio choices ("Correct" / "Incorrect"), so when called from the UI the comparison below never matches.
+    correct_answer = "Correctly"
     evaluation_response = "Correct" if correctness == correct_answer else "Incorrect"
+    # Assuming info_dict is updated by sample_and_display function
+    actual_model = info_dict.get('model', 'Unknown Model')
+    actual_completion = info_dict.get('completion', 'No completion available.')
+    # Update the completion text
+    completion_text = f"Completion: {actual_completion}\n\nChoice: {chr(info_dict.get('verdict', 0) + 65)}"
+    return evaluation_response, actual_model, completion_text
+# Initial sampling
+initial_topic = TOPICS['mmlu'][0]  # TOPICS is indexed by key; TOPICS['mmlu'] holds the topic choices, and the first one is the default
+question_text, evaluation_card_text, model_name, completion_text = sample_and_display(initial_topic)
 with gr.Blocks() as app:
+    topic = gr.Dropdown(choices=TOPICS['mmlu'], label="Select Topic", value=initial_topic)
     with gr.Row():
+        with gr.Column(scale=2):
+            evaluation_card = gr.Textbox(value=evaluation_card_text, label="Evaluation Card", interactive=False)
+            model = gr.Textbox(value=model_name, label="Model", interactive=False)
+            completion = gr.Textbox(value=completion_text, label="Model's Completion", interactive=False)
         with gr.Column(scale=1):
             question = gr.Textbox(value=question_text, label="Question", interactive=False)
             reasoning = gr.Textbox(lines=5, placeholder="Your reasoning (optional)")
             correctness = gr.Radio(choices=["Correct", "Incorrect"], label="I believe the model will answer this question")
             confidence = gr.Slider(minimum=0, maximum=10, step=1, label="Confidence")
+            output_text = gr.Text(label="Evaluation Output")
             submit_button = gr.Button("Submit")
+            next_button = gr.Button("Next Entry")
+    submit_button.click(fn=evaluate_guess, inputs=[reasoning, correctness, confidence, topic], outputs=[output_text, model, completion])
+    next_button.click(fn=sample_and_display, inputs=[topic], outputs=[question, evaluation_card, model, completion])
+app.launch()