curiositytech
/

MARS

@@ -7,76 +7,77 @@ base_model: meta-llama/Meta-Llama-3-8B-Instruct
 model-index:
 - name: MARS
   results:
-    - task:
-        type: text-generation
-        name: Text Generation
-      dataset:
-        name: AI2 Reasoning Challenge TR
-        type: ai2_arc
-        config: ARC-Challenge
-        split: test
-        args:
-          num_few_shot: 25
-      metrics:
-        - type: acc
-          value: 46.08
-          name: accuracy
-    - task:
-        type: text-generation
-        name: Text Generation
-      dataset:
-        name: MMLU TR
-        type: cais/mmlu
-        config: all
-        split: test
-        args:
-          num_few_shot: 5
-      metrics:
-        - type: acc
-          value: 47.02
-          name: accuracy
-    - task:
-        type: text-generation
-        name: Text Generation
-      dataset:
-        name: TruthfulQA TR
-        type: truthful_qa
-        config: multiple_choice
-        split: validation
-        args:
-          num_few_shot: 0
-      metrics:
-        - type: acc
-          name: accuracy
-          value: 49.38
-    - task:
-        type: text-generation
-        name: Text Generation
-      dataset:
-        name: Winogrande TR
-        type: winogrande
-        config: winogrande_xl
-        split: validation
-        args:
-          num_few_shot: 5
-      metrics:
-        - type: acc
-          value: 53.71
-          name: accuracy
-    - task:
-        type: text-generation
-        name: Text Generation
-      dataset:
-        name: GSM8k TR
-        type: gsm8k
-        config: main
-        split: test
-        args:
-          num_few_shot: 5
-      metrics:
-        - type: acc
-          value: 53.08
-          name: accuracy
 ---

 model-index:
 - name: MARS
   results:
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: AI2 Reasoning Challenge TR
+      type: ai2_arc
+      config: ARC-Challenge
+      split: test
+      args:
+        num_few_shot: 25
+    metrics:
+    - type: acc
+      value: 46.08
+      name: accuracy
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MMLU TR
+      type: cais/mmlu
+      config: all
+      split: test
+      args:
+        num_few_shot: 5
+    metrics:
+    - type: acc
+      value: 47.02
+      name: accuracy
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: TruthfulQA TR
+      type: truthful_qa
+      config: multiple_choice
+      split: validation
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: acc
+      name: accuracy
+      value: 49.38
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: Winogrande TR
+      type: winogrande
+      config: winogrande_xl
+      split: validation
+      args:
+        num_few_shot: 5
+    metrics:
+    - type: acc
+      value: 53.71
+      name: accuracy
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: GSM8k TR
+      type: gsm8k
+      config: main
+      split: test
+      args:
+        num_few_shot: 5
+    metrics:
+    - type: acc
+      value: 53.08
+      name: accuracy
+pipeline_tag: text-generation
 ---