diff --git "a/logs/l40-4gpu-8.txt" "b/logs/l40-4gpu-8.txt" --- "a/logs/l40-4gpu-8.txt" +++ "b/logs/l40-4gpu-8.txt" @@ -312,4 +312,7 @@ Qwen/Qwen2-72B-Instruct/checkpoint-560/rpp-1.02 metrics: {'meteor': 0.4796836675 Batch output: ['Old Geng raised his gun, squinted with one of his triangular eyes, and pulled the trigger. The hail of golden sparrows fell to the ground in a flurry, and bits of shot flew through the branches with a rustling sound.'] Qwen/Qwen2-72B-Instruct/checkpoint-560/rpp-1.04 metrics: {'meteor': 0.476362681282195, 'sacrebleu': {'score': 18.52063321160408, 'counts': [14564, 6684, 3677, 2141], 'totals': [27967, 26834, 25701, 24572], 'precisions': [52.07566059999285, 24.90869792054856, 14.306836309871212, 8.71316946117532], 'bp': 0.9235904535319178, 'sys_len': 27967, 'ref_len': 30190}, 'bleu_scores': {'bleu': 0.1852063321160408, 'precisions': [0.5207566059999285, 0.2490869792054856, 0.14306836309871213, 0.08713169461175321], 'brevity_penalty': 0.9235904535319178, 'length_ratio': 0.9263663464723418, 'translation_length': 27967, 'reference_length': 30190}, 'rouge_scores': {'rouge1': 0.5044329272755532, 'rouge2': 0.2644353224493149, 'rougeL': 0.4486941551906956, 'rougeLsum': 0.44880487550215126}, 'accuracy': 0.01323918799646955, 'correct_ids': [41, 77, 133, 193, 199, 272, 348, 364, 413, 567, 658, 712, 778, 893, 1011]} *** Evaluating with repetition_penalty: 1.06 - 0%| | 0/1133 [00:00