Spaces: Running on Zero

Commit · 15dd199
Parent(s): 347797e

refresh and persistent logging

Files changed:
- app.py (+7, -14)
- utils/leaderboard.py (+17, -3)
- utils/vote_logger.py (+19, -10)
app.py  CHANGED

@@ -406,36 +406,29 @@ The Elo rating system provides a more accurate ranking than simple win rates:
         outputs=[results_table_display]
     )
 
-    #
-    # First click event: Update UI immediately
+    # Use a single event chain for each button, structured to update UI first, then run inference
     for btn in [random_question_btn, try_another_btn]:
-
-
+        btn.click(
+            # Step 1: Show loading state immediately
             fn=show_loading_state,
             inputs=[],
             outputs=[summary_a_display, summary_b_display, vote_button_a,
                      vote_button_b, vote_button_tie, vote_button_neither]
         ).then(
+            # Step 2: Get new example
             fn=handle_new_example_click,
             inputs=[],
             outputs=[current_example]
         ).then(
+            # Step 3: Update context UI immediately
             fn=update_ui_for_new_context,
             inputs=[current_example],
             outputs=[query_display, context_description, context_display,
                      context_toggle_btn, show_full_context]
-    )
-
-    # Second click event for each button runs in parallel with the first
-    for btn in [random_question_btn, try_another_btn]:
-        # Generate model outputs (potentially slower operation)
-        event2 = btn.click(
-            fn=handle_new_example_click, # This will be called separately from the first event
-            inputs=[],
-            outputs=[current_example]
         ).then(
+            # Step 4: Then process example for model outputs
             fn=process_example,
-            inputs=[current_example],
+            inputs=[current_example],
             outputs=[model_a_name, model_b_name, summary_a_text, summary_b_text,
                      selected_winner, feedback_list, show_results_state, results_agg,
                      summary_a_display, summary_b_display, vote_button_a, vote_button_b,
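The change above collapses the two parallel click handlers into one chained event per button: the fast UI updates run first, the slow model call runs last. As a rough illustration of that pattern only (not the app's actual wiring), here is a minimal Gradio sketch with placeholder component and function names:

import time
import gradio as gr

# Minimal sketch of the single-event-chain pattern: the first callback returns
# immediately so the UI can show a loading state, and the slow model call runs
# in a later .then() step. All names here are placeholders, not the app's.
def show_loading():
    return "Loading..."

def run_inference():
    time.sleep(2)  # stand-in for the slower summarization step
    return "Model output ready"

with gr.Blocks() as demo:
    output_box = gr.Markdown()
    new_example_btn = gr.Button("New example")
    new_example_btn.click(
        fn=show_loading, inputs=[], outputs=[output_box]
    ).then(
        fn=run_inference, inputs=[], outputs=[output_box]
    )

demo.launch()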
utils/leaderboard.py  CHANGED

@@ -3,6 +3,7 @@ import pandas as pd
 import math
 from datetime import datetime
 from .models import models
+from huggingface_hub import CommitScheduler
 
 # Default K-factor (determines how much a single match affects ratings)
 DEFAULT_K_FACTOR = 32
@@ -10,6 +11,18 @@ DEFAULT_K_FACTOR = 32
 # Default starting Elo
 DEFAULT_ELO = 1500
 
+LEADERBOARD_FN = './arena_elo_leaderboard.csv'
+
+csv_path = os.path.join('utils', 'arena_elo_leaderboard.csv')
+
+leaderboard_scheduler = CommitScheduler(
+    repo_id="aizip-dev/Arena-Metadata",
+    folder_path="leaderboard",
+    repo_type="dataset",
+    every=5
+)
+
+
 def prepare_url(model_dict: dict):
     """
     Prepare the URL for the model based on its name.
@@ -119,7 +132,7 @@ def load_leaderboard_data():
 
     try:
         # Define the path to the CSV file for leaderboard
-        csv_path =
+        csv_path = LEADERBOARD_FN
 
         # Check if the file exists and load it
         if os.path.exists(csv_path):
@@ -247,8 +260,9 @@ def save_leaderboard_data(results):
         df = df.sort_values(by='elo', ascending=False)
 
         # Save to CSV
-
-
+        with leaderboard_scheduler.lock:
+            df.to_csv(csv_path, index=False)
+        print(f"Leaderboard data saved successfully to {csv_path}")
     except Exception as e:
         print(f"Error saving leaderboard data: {e}")
 
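For context, a minimal sketch of the huggingface_hub CommitScheduler pattern this diff relies on, assuming the documented API: the scheduler watches a local folder and commits its contents to the Hub repo in a background thread every `every` minutes, and file writes are guarded with `scheduler.lock` so a partially written file is never uploaded. The repo id, folder, and file name below are placeholders, not the app's real values.

import pandas as pd
from pathlib import Path
from huggingface_hub import CommitScheduler

folder = Path("leaderboard")
folder.mkdir(exist_ok=True)

# Background thread pushes everything under `folder` to the dataset repo
# every 5 minutes. repo_id is a placeholder.
scheduler = CommitScheduler(
    repo_id="your-org/your-metadata-dataset",
    repo_type="dataset",
    folder_path=folder,
    every=5,  # minutes between scheduled commits
)

def save_csv(df: pd.DataFrame) -> None:
    # Hold the scheduler's lock while writing so a scheduled commit never
    # uploads a half-written file.
    with scheduler.lock:
        df.to_csv(folder / "arena_elo_leaderboard.csv", index=False)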
utils/vote_logger.py  CHANGED

@@ -3,6 +3,14 @@ import csv
 import json
 from datetime import datetime
 import pandas as pd
+from huggingface_hub import CommitScheduler
+
+vote_details_scheduler = CommitScheduler(
+    repo_id="aizip-dev/Arena-Metadata",
+    folder_path="votes",
+    repo_type="dataset",
+    every=5
+)
 
 def save_vote_details(example, model_a, model_b, winner, feedback, summary_a, summary_b):
     """
@@ -35,17 +43,18 @@ def save_vote_details(example, model_a, model_b, winner, feedback, summary_a, summary_b):
 
     try:
         # Open the file in append mode
-        with
-
-
-
-
-
-
-
-
+        with vote_details_scheduler:
+            with open(csv_path, 'a', newline='', encoding='utf-8') as f:
+                writer = csv.DictWriter(f, fieldnames=vote_record.keys())
+
+                # Write header if file doesn't exist
+                if not file_exists:
+                    writer.writeheader()
+
+                # Write the vote record
+                writer.writerow(vote_record)
 
-
+        print(f"Vote details saved to {csv_path}")
     except Exception as e:
         print(f"Error saving vote details: {e}")
 
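A self-contained sketch of the append-with-header CSV pattern that save_vote_details uses: check whether the file exists before opening, write the header only on the first write, then append one row per record. The path and record below are placeholders; the real function builds vote_record from the example, the two models, the winner, and the feedback.

import csv
import os

# Placeholder path and record, for illustration only.
csv_path = "votes/vote_details.csv"
vote_record = {"timestamp": "2025-01-01T00:00:00", "winner": "model_a", "feedback": "concise"}

os.makedirs(os.path.dirname(csv_path), exist_ok=True)
file_exists = os.path.exists(csv_path)

# Append one row per vote; the header is written only when the file is first created.
with open(csv_path, "a", newline="", encoding="utf-8") as f:
    writer = csv.DictWriter(f, fieldnames=vote_record.keys())
    if not file_exists:
        writer.writeheader()
    writer.writerow(vote_record)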