Update src/about.py
Changed file: src/about.py (+5 lines, −4 lines)
@@ -21,19 +21,20 @@ NUM_FEWSHOT = 0  # Change with your few shot
|
|
| 21 |
|
| 22 |
|
| 23 |
# Your leaderboard name
|
| 24 |
-
TITLE = """<h1 align="center" id="space-title">
|
| 25 |
|
| 26 |
# What does your leaderboard evaluate?
|
| 27 |
INTRODUCTION_TEXT = """
|
| 28 |
-
|
|
|
|
| 29 |
"""
|
| 30 |
|
| 31 |
# Which evaluations are you running? how can people reproduce what you have?
|
| 32 |
LLM_BENCHMARKS_TEXT = f"""
|
| 33 |
-
|
| 34 |
|
| 35 |
## Reproducibility
|
| 36 |
-
|
| 37 |
|
| 38 |
"""
|
| 39 |
|
|
|
|
# Your leaderboard name
TITLE = """<h1 align="center" id="space-title">ARFBench Multimodal Time Series Reasoning Leaderboard</h1>"""

# What does your leaderboard evaluate?
INTRODUCTION_TEXT = """
**ARF**Bench (**A**nomaly **R**easoning **F**ramework Benchmark) is a multimodal time-series reasoning benchmark consisting of 550 question-answer (QA) pairs composed from
real-world incident data collected at Datadog, a leading observability platform.
"""

# Which evaluations are you running? how can people reproduce what you have?
# NOTE: kept as an f-string to match the original; no placeholders are visible
# in this chunk, but the full file may interpolate values elsewhere — confirm.
LLM_BENCHMARKS_TEXT = f"""
For more details on the benchmark, refer to the [ARFBench dataset card](https://huggingface.co/datasets/Datadog/ARFBench)

## Reproducibility
Coming soon!
"""