{
  "results": {
    "gsm8k": {
      "acc": 0.047763457164518575,
      "acc_stderr": 0.005874387536229333
    }
  },
  "versions": {
    "gsm8k": 0
  },
  "config": {
    "model": "sparseml",
    "model_args": "pretrained=/network/alexandre/research/cerebras/llama2_7B_sparse70_retrained/ultrachat200k/llama2_7B_sparse70_LR3e-4_GC2_E2/training,dtype=bfloat16",
    "num_fewshot": 5,
    "batch_size": "16",
    "batch_sizes": [],
    "device": "cuda:6",
    "no_cache": true,
    "limit": null,
    "bootstrap_iters": 100000,
    "description_dict": {}
  }
}