Renming Zhang
committed on
Commit
•
43feb65
1
Parent(s):
55aff67
added image
Browse files- app.py +11 -2
- assets/logo.png +0 -0
- src/display/about.py +0 -1
app.py
CHANGED
@@ -24,6 +24,7 @@ from src.display.utils import (
|
|
24 |
Precision
|
25 |
)
|
26 |
from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, H4_TOKEN, IS_PUBLIC, QUEUE_REPO, REPO_ID, RESULTS_REPO
|
|
|
27 |
# from src.populate import get_evaluation_queue_df, get_leaderboard_df
|
28 |
# from src.submission.submit import add_new_eval
|
29 |
# from src.tools.collections import update_collections
|
@@ -207,7 +208,7 @@ class LLM_Model:
|
|
207 |
|
208 |
|
209 |
games = ["Breakthrough", "Connect Four", "Blind Auction", "Kuhn Poker",
|
210 |
-
"Liar's Dice", "Negotiation", "Nim", "Pig", "Iterated
|
211 |
|
212 |
# models = ["gpt-35-turbo-1106", "gpt-4", "Llama-2-70b-chat-hf", "CodeLlama-34b-Instruct-hf",
|
213 |
# "CodeLlama-70b-Instruct-hf", "Mistral-7B-Instruct-v01", "Mistral-7B-OpenOrca"]
|
@@ -217,10 +218,18 @@ games = ["Breakthrough", "Connect Four", "Blind Auction", "Kuhn Poker",
|
|
217 |
|
218 |
demo = gr.Blocks(css=custom_css)
|
219 |
|
|
|
|
|
|
|
|
|
|
|
|
|
220 |
with demo:
|
|
|
|
|
221 |
gr.HTML(TITLE)
|
222 |
-
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
223 |
|
|
|
224 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
225 |
with gr.TabItem("🏆 GTBench", elem_id="llm-benchmark-tab-table", id=0):
|
226 |
with gr.Row():
|
|
|
24 |
Precision
|
25 |
)
|
26 |
from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, H4_TOKEN, IS_PUBLIC, QUEUE_REPO, REPO_ID, RESULTS_REPO
|
27 |
+
from PIL import Image
|
28 |
# from src.populate import get_evaluation_queue_df, get_leaderboard_df
|
29 |
# from src.submission.submit import add_new_eval
|
30 |
# from src.tools.collections import update_collections
|
|
|
208 |
|
209 |
|
210 |
games = ["Breakthrough", "Connect Four", "Blind Auction", "Kuhn Poker",
|
211 |
+
"Liar's Dice", "Negotiation", "Nim", "Pig", "Iterated Prisoner's Dilemma", "Tic-Tac-Toe"]
|
212 |
|
213 |
# models = ["gpt-35-turbo-1106", "gpt-4", "Llama-2-70b-chat-hf", "CodeLlama-34b-Instruct-hf",
|
214 |
# "CodeLlama-70b-Instruct-hf", "Mistral-7B-Instruct-v01", "Mistral-7B-OpenOrca"]
|
|
|
218 |
|
219 |
demo = gr.Blocks(css=custom_css)
|
220 |
|
221 |
+
|
222 |
+
def load_image(image_path):
|
223 |
+
image = Image.open(image_path)
|
224 |
+
return image
|
225 |
+
|
226 |
+
|
227 |
with demo:
|
228 |
+
gr.Image("./assets/logo.png", height="200px", width="200px",
|
229 |
+
show_download_button=False, container=False)
|
230 |
gr.HTML(TITLE)
|
|
|
231 |
|
232 |
+
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
233 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
234 |
with gr.TabItem("🏆 GTBench", elem_id="llm-benchmark-tab-table", id=0):
|
235 |
with gr.Row():
|
assets/logo.png
ADDED
src/display/about.py
CHANGED
@@ -1,7 +1,6 @@
|
|
1 |
# from src.display.utils import ModelType
|
2 |
|
3 |
TITLE = """
|
4 |
-
<embed src="../../assets/logo.pdf" width="200px" height="200px" />
|
5 |
<h1 align="center" id="space-title">GTBench: Uncovering the Strategic Reasoning Limitation of LLMs via Game-Theoretic Evaluations</h1>"""
|
6 |
|
7 |
INTRODUCTION_TEXT = """
|
|
|
1 |
# from src.display.utils import ModelType
|
2 |
|
3 |
TITLE = """
|
|
|
4 |
<h1 align="center" id="space-title">GTBench: Uncovering the Strategic Reasoning Limitation of LLMs via Game-Theoretic Evaluations</h1>"""
|
5 |
|
6 |
INTRODUCTION_TEXT = """
|