bloomz
/
evaluation_bloomz
/evaluation_val
/wmt14_fr_en
/slim.limited=3000.model=xp3capmixnewcodelonglossseq_global_step498.task=wmt14_fr_en.templates=gpt3-fr-en.fewshot=0.batchsize=4.seed=1234.timestamp=2022-09-11T00:39:32.json
{ | |
"results": [ | |
{ | |
"task_name": "wmt14_fr_en", | |
"prompt_name": "gpt3-fr-en", | |
"bleu": 28.97671081332691, | |
"dataset_path": "wmt14", | |
"dataset_name": "fr-en", | |
"subset": null, | |
"bleu_stderr": 0.3781852673062757 | |
} | |
], | |
"config": { | |
"model": "hf-causal", | |
"model_args": "pretrained=/gpfsscratch/rech/six/commun/commun/experiments/muennighoff/bloomckpt/176bt0/xp3capmixnewcodelonglossseq_global_step498,use_accelerate=True,tokenizer=/gpfsscratch/rech/six/commun/commun/experiments/muennighoff/bloomckpt/176bt0/xp3capmixnewcodelonglossseq_global_step498,dtype=bfloat16", | |
"num_fewshot": 0, | |
"batch_size": 4, | |
"device": "cuda", | |
"use_cache": false, | |
"limit": 3000, | |
"bootstrap_iters": 10, | |
"seed": 1234 | |
} | |
} |