File size: 668 Bytes
dd8cf92
 
f8ae921
 
 
 
46bcca0
 
b79c971
 
f8ae921
b25a00b
 
46bcca0
 
 
 
 
 
f8ae921
 
 
 
2561b63
f8ae921
 
11257ec
 
 
f8ae921
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Task configuration for the `halueval_qa` evaluation task.
# Group(s) this task is listed under.
group:
  - halueval
# Name of this task.
task: halueval_qa
# Dataset identifier and the configuration (subset) name to load.
# NOTE(review): presumably a Hugging Face Hub dataset id — confirm.
dataset_path: pminervini/HaluEval
dataset_name: qa_samples
# Output mode; presumably free-form generation that ends at one of the
# stop sequences configured under `generation_kwargs` — confirm against
# the consuming harness.
output_type: generate_until
# No training or validation split is configured; the only split referenced
# is the one named "data", used as the test split.
training_split: null
validation_split: null
test_split: data
# Number of few-shot examples: zero.
num_fewshot: 0
# `!function` is a custom (non-core) YAML tag, so this file needs a loader
# that registers it. The tagged values presumably name functions in a
# sibling `utils` module — verify against the loader.
doc_to_text: !function utils.doc_to_text_qa
doc_to_target: !function utils.doc_to_target
process_results: !function utils.process_results
# Decoding settings for this task.
generation_kwargs:
  # Stop sequences: a newline or a period. Double quotes are required so
  # that "\n" is an actual newline character rather than backslash + n.
  # NOTE(review): stopping at "." presumably cuts off answers that contain a
  # period (abbreviations, decimals) — confirm this is intended.
  until: ["\n", "."]
  # Sampling is switched off and the temperature is zero.
  do_sample: false
  temperature: 0.0
# Metrics reported for this task. Each entry is aggregated with `mean` and
# is marked as higher-is-better.
# NOTE(review): the metric names presumably have to match the keys returned
# by `utils.process_results` — confirm against that function.
metric_list:
  - metric: em
    aggregation: mean
    higher_is_better: true
  - metric: correctness
    aggregation: mean
    higher_is_better: true
  - metric: acc
    aggregation: mean
    higher_is_better: true
# Task metadata. Written as a mapping rather than a one-item list so that
# `version` can be looked up directly by key (a list of single-key maps
# hides the key from `"version" in metadata` / `metadata["version"]`).
metadata:
  version: 0.0