Chibu Ukachi committed on
Commit ·
ee8242c
1
Parent(s): 79613cc
replace org name
Browse files
every_eval_ever/aime25.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
-
"evaluation_id": "aime25/
|
| 4 |
"evaluation_timestamp": "7718166",
|
| 5 |
"retrieved_timestamp": "1777568692.163912",
|
| 6 |
"source_metadata": {
|
|
@@ -14,9 +14,9 @@
|
|
| 14 |
"version": "v0.13.0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
-
"name": "
|
| 18 |
-
"id": "
|
| 19 |
-
"developer": "
|
| 20 |
"inference_engine": {
|
| 21 |
"name": "vllm"
|
| 22 |
},
|
|
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
+
"evaluation_id": "aime25/RedHatAI/MiniMax-M2.5.w8a8/1777568692.163912",
|
| 4 |
"evaluation_timestamp": "7718166",
|
| 5 |
"retrieved_timestamp": "1777568692.163912",
|
| 6 |
"source_metadata": {
|
|
|
|
| 14 |
"version": "v0.13.0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
+
"name": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 18 |
+
"id": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 19 |
+
"developer": "RedHatAI",
|
| 20 |
"inference_engine": {
|
| 21 |
"name": "vllm"
|
| 22 |
},
|
every_eval_ever/gpqa_diamond.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
-
"evaluation_id": "gpqa:diamond/
|
| 4 |
"evaluation_timestamp": "7704068",
|
| 5 |
"retrieved_timestamp": "1777568737.410978",
|
| 6 |
"source_metadata": {
|
|
@@ -14,9 +14,9 @@
|
|
| 14 |
"version": "v0.13.0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
-
"name": "
|
| 18 |
-
"id": "
|
| 19 |
-
"developer": "
|
| 20 |
"inference_engine": {
|
| 21 |
"name": "vllm"
|
| 22 |
},
|
|
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
+
"evaluation_id": "gpqa:diamond/RedHatAI/MiniMax-M2.5.w8a8/1777568737.410978",
|
| 4 |
"evaluation_timestamp": "7704068",
|
| 5 |
"retrieved_timestamp": "1777568737.410978",
|
| 6 |
"source_metadata": {
|
|
|
|
| 14 |
"version": "v0.13.0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
+
"name": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 18 |
+
"id": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 19 |
+
"developer": "RedHatAI",
|
| 20 |
"inference_engine": {
|
| 21 |
"name": "vllm"
|
| 22 |
},
|
every_eval_ever/gsm8k_platinum_cot_llama.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
-
"evaluation_id": "gsm8k_platinum_cot_llama/
|
| 4 |
"evaluation_timestamp": "1777483916",
|
| 5 |
"retrieved_timestamp": "1777568615.837832",
|
| 6 |
"source_metadata": {
|
|
@@ -14,11 +14,11 @@
|
|
| 14 |
"version": "0.4.12.dev0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
-
"name": "
|
| 18 |
-
"id": "
|
| 19 |
-
"developer": "
|
| 20 |
"additional_details": {
|
| 21 |
-
"model_args": "{'model': '
|
| 22 |
"seed": "1234",
|
| 23 |
"num_seeds_merged": "3"
|
| 24 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
+
"evaluation_id": "gsm8k_platinum_cot_llama/RedHatAI/MiniMax-M2.5.w8a8/1777568615.837832",
|
| 4 |
"evaluation_timestamp": "1777483916",
|
| 5 |
"retrieved_timestamp": "1777568615.837832",
|
| 6 |
"source_metadata": {
|
|
|
|
| 14 |
"version": "0.4.12.dev0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
+
"name": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 18 |
+
"id": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 19 |
+
"developer": "RedHatAI",
|
| 20 |
"additional_details": {
|
| 21 |
+
"model_args": "{'model': 'RedHatAI/MiniMax-M2.5.w8a8', 'max_length': 196608, 'base_url': 'http://0.0.0.0:8000/v1/chat/completions', 'num_concurrent': 128, 'max_retries': 3, 'tokenized_requests': False, 'tokenizer_backend': None, 'timeout': 2400}",
|
| 22 |
"seed": "1234",
|
| 23 |
"num_seeds_merged": "3"
|
| 24 |
}
|
every_eval_ever/ifeval.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
-
"evaluation_id": "ifeval/
|
| 4 |
"evaluation_timestamp": "1777485653",
|
| 5 |
"retrieved_timestamp": "1777568653.331068",
|
| 6 |
"source_metadata": {
|
|
@@ -14,11 +14,11 @@
|
|
| 14 |
"version": "0.4.12.dev0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
-
"name": "
|
| 18 |
-
"id": "
|
| 19 |
-
"developer": "
|
| 20 |
"additional_details": {
|
| 21 |
-
"model_args": "{'model': '
|
| 22 |
"seed": "1234",
|
| 23 |
"num_seeds_merged": "3"
|
| 24 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
+
"evaluation_id": "ifeval/RedHatAI/MiniMax-M2.5.w8a8/1777568653.331068",
|
| 4 |
"evaluation_timestamp": "1777485653",
|
| 5 |
"retrieved_timestamp": "1777568653.331068",
|
| 6 |
"source_metadata": {
|
|
|
|
| 14 |
"version": "0.4.12.dev0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
+
"name": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 18 |
+
"id": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 19 |
+
"developer": "RedHatAI",
|
| 20 |
"additional_details": {
|
| 21 |
+
"model_args": "{'model': 'RedHatAI/MiniMax-M2.5.w8a8', 'max_length': 196608, 'base_url': 'http://0.0.0.0:8000/v1/chat/completions', 'num_concurrent': 128, 'max_retries': 3, 'tokenized_requests': False, 'tokenizer_backend': None, 'timeout': 2400}",
|
| 22 |
"seed": "1234",
|
| 23 |
"num_seeds_merged": "3"
|
| 24 |
}
|
every_eval_ever/math_500.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
-
"evaluation_id": "math_500/
|
| 4 |
"evaluation_timestamp": "7694693",
|
| 5 |
"retrieved_timestamp": "1777568712.013831",
|
| 6 |
"source_metadata": {
|
|
@@ -14,9 +14,9 @@
|
|
| 14 |
"version": "v0.13.0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
-
"name": "
|
| 18 |
-
"id": "
|
| 19 |
-
"developer": "
|
| 20 |
"inference_engine": {
|
| 21 |
"name": "vllm"
|
| 22 |
},
|
|
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
+
"evaluation_id": "math_500/RedHatAI/MiniMax-M2.5.w8a8/1777568712.013831",
|
| 4 |
"evaluation_timestamp": "7694693",
|
| 5 |
"retrieved_timestamp": "1777568712.013831",
|
| 6 |
"source_metadata": {
|
|
|
|
| 14 |
"version": "v0.13.0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
+
"name": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 18 |
+
"id": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 19 |
+
"developer": "RedHatAI",
|
| 20 |
"inference_engine": {
|
| 21 |
"name": "vllm"
|
| 22 |
},
|
every_eval_ever/mmlu_pro_chat.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
-
"evaluation_id": "mmlu_pro_chat/
|
| 4 |
"evaluation_timestamp": "1777572326",
|
| 5 |
"retrieved_timestamp": "1777980581.186022",
|
| 6 |
"source_metadata": {
|
|
@@ -14,11 +14,11 @@
|
|
| 14 |
"version": "0.4.12.dev0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
-
"name": "
|
| 18 |
-
"id": "
|
| 19 |
-
"developer": "
|
| 20 |
"additional_details": {
|
| 21 |
-
"model_args": "{'model': '
|
| 22 |
"seed": "1234",
|
| 23 |
"num_seeds_merged": "3"
|
| 24 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"schema_version": "0.2.2",
|
| 3 |
+
"evaluation_id": "mmlu_pro_chat/RedHatAI/MiniMax-M2.5.w8a8/1777980581.186022",
|
| 4 |
"evaluation_timestamp": "1777572326",
|
| 5 |
"retrieved_timestamp": "1777980581.186022",
|
| 6 |
"source_metadata": {
|
|
|
|
| 14 |
"version": "0.4.12.dev0"
|
| 15 |
},
|
| 16 |
"model_info": {
|
| 17 |
+
"name": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 18 |
+
"id": "RedHatAI/MiniMax-M2.5.w8a8",
|
| 19 |
+
"developer": "RedHatAI",
|
| 20 |
"additional_details": {
|
| 21 |
+
"model_args": "{'model': 'RedHatAI/MiniMax-M2.5.w8a8', 'max_length': 196608, 'base_url': 'http://0.0.0.0:8000/v1/chat/completions', 'num_concurrent': 28, 'max_retries': 3, 'tokenized_requests': False, 'tokenizer_backend': None, 'timeout': 2400}",
|
| 22 |
"seed": "1234",
|
| 23 |
"num_seeds_merged": "3"
|
| 24 |
}
|