TongZheng1999's picture
Upload folder using huggingface_hub
2867a30 verified
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 0 score: 0.8037
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1 score: 0.8955
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 2 score: 0.8598
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 3 score: 0.8753
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 4 score: 0.8860
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 5 score: 0.7282
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 6 score: 0.9288
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 7 score: 0.8856
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 8 score: 0.9076
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 9 score: 0.9053
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 10 score: 0.9157
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 11 score: 0.7933
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 12 score: 0.8758
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 13 score: 0.8823
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 14 score: 0.8845
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 15 score: 0.2519
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 16 score: 0.8626
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 17 score: 0.9371
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 18 score: 0.8325
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 19 score: 0.8873
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 20 score: 0.9230
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 21 score: 0.8934
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 22 score: 0.9278
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 23 score: 0.8589
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 24 score: 0.8773
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 25 score: 0.9209
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 26 score: 0.8507
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 27 score: 0.8283
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 28 score: 0.8405
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 29 score: 0.9091
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 30 score: 0.7933
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 31 score: 0.8383
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 32 score: 0.8900
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 33 score: 0.9328
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 34 score: 0.9174
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 35 score: 0.9126
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 36 score: 0.8159
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 37 score: 0.8860
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 38 score: 0.7763
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 39 score: 0.9146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 40 score: 0.8582
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 41 score: 0.9666
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 42 score: 0.5230
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 43 score: 0.8734
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 44 score: 0.7362
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 45 score: 0.8924
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 46 score: 0.8535
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 47 score: 0.9267
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 48 score: 0.8077
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 49 score: 0.8717
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 50 score: 0.8978
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 51 score: 0.8753
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 52 score: 0.9151
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 53 score: 0.9357
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 54 score: 0.9017
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 55 score: 0.8019
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 56 score: 0.8785
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 57 score: 0.8566
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 58 score: 0.9065
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 59 score: 0.9361
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 60 score: 0.9184
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 61 score: 0.8653
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 62 score: 0.8795
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 63 score: 0.9156
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 64 score: 0.8474
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 65 score: 0.7176
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 66 score: 0.7443
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 67 score: 0.7680
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 68 score: 0.9114
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 69 score: 0.9140
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 70 score: 0.8951
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 71 score: 0.7553
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 72 score: 0.8744
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 73 score: 0.8800
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 74 score: 0.9010
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 75 score: 0.8797
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 76 score: 0.9228
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 77 score: 0.8039
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 78 score: 0.9717
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 79 score: 0.8496
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 80 score: 0.4433
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 81 score: 0.9067
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 82 score: 0.8704
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 83 score: 0.6399
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 84 score: 0.8927
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 85 score: 0.7391
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 86 score: 0.8198
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 87 score: 0.8979
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 88 score: 0.8878
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 89 score: 0.7105
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 90 score: 0.7739
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 91 score: 0.7803
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 92 score: 0.3861
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 93 score: 0.9309
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 94 score: 0.9261
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 95 score: 0.9264
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 96 score: 0.9205
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 97 score: 0.7154
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 98 score: 0.8978
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 99 score: 0.8542
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 100 score: 0.8506
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 101 score: 0.8310
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 102 score: 0.8927
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 103 score: 0.9637
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 104 score: 0.2592
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 105 score: 0.3412
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 106 score: 0.8765
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 107 score: 0.7326
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 108 score: 0.7969
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 109 score: 0.8025
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 110 score: 0.8778
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 111 score: 0.9419
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 112 score: 0.9407
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 113 score: 0.8630
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 114 score: 0.6932
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 115 score: 0.2605
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 116 score: 0.8842
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 117 score: 0.9231
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 118 score: 0.9194
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 119 score: 0.7786
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 120 score: 0.8739
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 121 score: 0.7667
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 122 score: 0.9211
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 123 score: 0.9606
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 124 score: 0.7645
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 125 score: 0.9114
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 126 score: 0.9057
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 127 score: 0.9097
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 128 score: 0.9214
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 129 score: 0.9152
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 130 score: 0.8224
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 131 score: 0.6644
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 132 score: 0.9099
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 133 score: 0.9428
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 134 score: 0.7515
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 135 score: 0.8297
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 136 score: 0.9346
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 137 score: 0.9073
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 138 score: 0.9323
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 139 score: 0.8718
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 140 score: 0.9057
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 141 score: 0.9258
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 142 score: 0.8636
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 143 score: 0.9367
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 144 score: 0.9064
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 145 score: 0.9147
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 146 score: 0.9516
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 147 score: 0.9374
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 148 score: 0.8808
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 149 score: 0.9232
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 150 score: 0.8718
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 151 score: 0.7301
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 152 score: 0.8496
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 153 score: 0.8040
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 154 score: 0.7635
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 155 score: 0.9010
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 156 score: 0.9131
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 157 score: 0.8356
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 158 score: 0.8256
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 159 score: 0.9279
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 160 score: 0.6863
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 161 score: 0.7794
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 162 score: 0.8631
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 163 score: 0.9146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 164 score: 0.9322
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 165 score: 0.8066
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 166 score: 0.9096
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 167 score: 0.9119
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 168 score: 0.3007
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 169 score: 0.8257
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 170 score: 0.8179
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 171 score: 0.9367
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 172 score: 0.8980
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 173 score: 0.9290
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 174 score: 0.7205
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 175 score: 0.9253
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 176 score: 0.7994
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 177 score: 0.8647
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 178 score: 0.9220
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 179 score: 0.9011
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 180 score: 0.9091
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 181 score: 0.8872
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 182 score: 0.9488
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 183 score: 0.9388
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 184 score: 0.8979
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 185 score: 0.8985
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 186 score: 0.9260
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 187 score: 0.8278
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 188 score: 0.8588
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 189 score: 0.8225
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 190 score: 0.8475
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 191 score: 0.8974
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 192 score: 0.8986
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 193 score: 0.8495
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 194 score: 0.8693
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 195 score: 0.9213
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 196 score: 0.9154
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 197 score: 0.8010
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 198 score: 0.7922
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 199 score: 0.8738
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 200 score: 0.8113
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 201 score: 0.8038
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 202 score: 0.8185
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 203 score: 0.7874
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 204 score: 0.9043
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 205 score: 0.9079
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 206 score: 0.8271
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 207 score: 0.8092
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 208 score: 0.8781
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 209 score: 0.8404
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 210 score: 0.9510
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 211 score: 0.8921
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 212 score: 0.9017
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 213 score: 0.9310
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 214 score: 0.8675
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 215 score: 0.9175
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 216 score: 0.8059
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 217 score: 0.9243
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 218 score: 0.9377
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 219 score: 0.8299
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 220 score: 0.9427
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 221 score: 0.8912
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 222 score: 0.9322
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 223 score: 0.2915
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 224 score: 0.9436
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 225 score: 0.9584
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 226 score: 0.8639
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 227 score: 0.7326
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 228 score: 0.8428
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 229 score: 0.8522
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 230 score: 0.9426
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 231 score: 0.6101
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 232 score: 0.7245
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 233 score: 0.5952
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 234 score: 0.7890
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 235 score: 0.8574
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 236 score: 0.9218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 237 score: 0.9117
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 238 score: 0.9229
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 239 score: 0.8550
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 240 score: 0.8342
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 241 score: 0.2805
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 242 score: 0.8394
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 243 score: 0.8237
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 244 score: 0.7847
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 245 score: 0.9210
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 246 score: 0.7604
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 247 score: 0.4200
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 248 score: 0.6859
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 249 score: 0.9618
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 250 score: 0.8939
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 251 score: 0.9269
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 252 score: 0.9426
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 253 score: 0.9212
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 254 score: 0.9422
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 255 score: 0.9495
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 256 score: 0.8393
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 257 score: 0.9104
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 258 score: 0.9230
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 259 score: 0.8972
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 260 score: 0.9312
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 261 score: 0.8238
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 262 score: 0.8809
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 263 score: 0.7790
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 264 score: 0.9287
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 265 score: 0.9092
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 266 score: 0.8873
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 267 score: 0.8801
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 268 score: 0.8991
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 269 score: 0.9170
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 270 score: 0.8225
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 271 score: 0.8152
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 272 score: 0.9078
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 273 score: 0.8697
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 274 score: 0.8295
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 275 score: 0.4001
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 276 score: 0.8406
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 277 score: 0.9507
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 278 score: 0.8791
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 279 score: 0.6679
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 280 score: 0.9022
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 281 score: 0.1932
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 282 score: 0.9376
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 283 score: 0.8284
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 284 score: 0.8889
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 285 score: 0.9068
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 286 score: 0.9382
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 287 score: 0.8544
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 288 score: 0.7830
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 289 score: 0.8540
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 290 score: 0.8716
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 291 score: 0.8998
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 292 score: 0.9244
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 293 score: 0.8478
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 294 score: 0.8490
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 295 score: 0.8940
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 296 score: 0.8359
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 297 score: 0.9413
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 298 score: 0.8246
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 299 score: 0.8996
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 300 score: 0.9267
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 301 score: 0.7647
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 302 score: 0.8883
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 303 score: 0.9372
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 304 score: 0.8584
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 305 score: 0.8239
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 306 score: 0.8624
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 307 score: 0.9207
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 308 score: 0.9414
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 309 score: 0.8827
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 310 score: 0.9534
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 311 score: 0.9340
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 312 score: 0.9242
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 313 score: 0.8657
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 314 score: 0.9557
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 315 score: 0.9594
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 316 score: 0.7053
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 317 score: 0.9033
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 318 score: 0.8598
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 319 score: 0.7950
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 320 score: 0.7793
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 321 score: 0.8544
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 322 score: 0.9157
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 323 score: 0.8941
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 324 score: 0.9307
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 325 score: 0.8720
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 326 score: 0.8526
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 327 score: 0.8810
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 328 score: 0.8999
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 329 score: 0.9396
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 330 score: 0.8877
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 331 score: 0.3057
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 332 score: 0.9501
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 333 score: 0.7422
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 334 score: 0.9797
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 335 score: 0.3863
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 336 score: 0.9218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 337 score: 0.8753
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 338 score: 0.8445
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 339 score: 0.8785
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 340 score: 0.7961
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 341 score: 0.8431
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 342 score: 0.4473
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 343 score: 0.8208
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 344 score: 0.8692
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 345 score: 0.8486
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 346 score: 0.8989
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 347 score: 0.8254
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 348 score: 0.3127
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 349 score: 0.6858
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 350 score: 0.9184
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 351 score: 0.9345
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 352 score: 0.9198
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 353 score: 0.8551
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 354 score: 0.8794
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 355 score: 0.9260
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 356 score: 0.9291
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 357 score: 0.9197
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 358 score: 0.9042
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 359 score: 0.7860
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 360 score: 0.7225
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 361 score: 0.8724
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 362 score: 0.8789
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 363 score: 0.8403
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 364 score: 0.8838
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 365 score: 0.7733
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 366 score: 0.7238
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 367 score: 0.2422
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 368 score: 0.4313
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 369 score: 0.8146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 370 score: 0.8334
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 371 score: 0.2628
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 372 score: 0.8593
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 373 score: 0.9089
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 374 score: 0.9364
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 375 score: 0.9177
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 376 score: 0.8911
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 377 score: 0.9148
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 378 score: 0.8774
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 379 score: 0.8861
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 380 score: 0.8980
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 381 score: 0.9230
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 382 score: 0.7013
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 383 score: 0.7283
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 384 score: 0.9260
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 385 score: 0.8220
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 386 score: 0.8248
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 387 score: 0.9042
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 388 score: 0.8720
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 389 score: 0.9329
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 390 score: 0.9370
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 391 score: 0.8232
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 392 score: 0.9177
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 393 score: 0.8810
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 394 score: 0.9540
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 395 score: 0.9711
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 396 score: 0.8477
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 397 score: 0.9435
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 398 score: 0.8549
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 399 score: 0.9343
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 400 score: 0.9579
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 401 score: 0.8173
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 402 score: 0.8289
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 403 score: 0.6956
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 404 score: 0.8070
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 405 score: 0.8490
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 406 score: 0.9224
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 407 score: 0.4117
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 408 score: 0.9251
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 409 score: 0.9290
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 410 score: 0.8930
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 411 score: 0.8349
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 412 score: 0.8360
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 413 score: 0.9258
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 414 score: 0.8687
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 415 score: 0.9199
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 416 score: 0.8000
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 417 score: 0.8572
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 418 score: 0.9249
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 419 score: 0.8856
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 420 score: 0.9441
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 421 score: 0.9239
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 422 score: 0.6896
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 423 score: 0.8498
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 424 score: 0.8918
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 425 score: 0.9357
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 426 score: 0.9196
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 427 score: 0.9055
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 428 score: 0.9155
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 429 score: 0.9494
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 430 score: 0.7845
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 431 score: 0.8198
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 432 score: 0.8286
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 433 score: 0.8670
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 434 score: 0.7174
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 435 score: 0.8944
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 436 score: 0.8720
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 437 score: 0.8900
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 438 score: 0.9465
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 439 score: 0.9230
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 440 score: 0.9213
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 441 score: 0.9187
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 442 score: 0.9592
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 443 score: 0.9213
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 444 score: 0.8015
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 445 score: 0.8896
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 446 score: 0.9318
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 447 score: 0.8686
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 448 score: 0.8709
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 449 score: 0.8440
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 450 score: 0.9212
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 451 score: 0.9252
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 452 score: 0.9400
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 453 score: 0.9249
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 454 score: 0.8817
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 455 score: 0.9126
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 456 score: 0.6301
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 457 score: 0.9424
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 458 score: 0.8877
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 459 score: 0.8903
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 460 score: 0.9096
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 461 score: 0.8892
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 462 score: 0.8147
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 463 score: 0.9424
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 464 score: 0.9176
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 465 score: 0.8556
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 466 score: 0.9324
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 467 score: 0.7645
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 468 score: 0.6203
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 469 score: 0.7615
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 470 score: 0.7080
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 471 score: 0.8549
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 472 score: 0.7478
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 473 score: 0.6823
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 474 score: 0.7851
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 475 score: 0.9343
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 476 score: 0.7876
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 477 score: 0.9206
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 478 score: 0.8572
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 479 score: 0.9261
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 480 score: 0.8850
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 481 score: 0.8503
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 482 score: 0.8617
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 483 score: 0.9056
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 484 score: 0.9102
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 485 score: 0.7774
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 486 score: 0.8908
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 487 score: 0.8585
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 488 score: 0.9288
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 489 score: 0.8311
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 490 score: 0.8246
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 491 score: 0.9300
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 492 score: 0.9630
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 493 score: 0.9439
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 494 score: 0.8371
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 495 score: 0.9034
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 496 score: 0.8982
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 497 score: 0.8415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 498 score: 0.8627
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 499 score: 0.8909
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 500 score: 0.9367
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 501 score: 0.9505
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 502 score: 0.9122
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 503 score: 0.8977
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 504 score: 0.7709
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 505 score: 0.9321
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 506 score: 0.8013
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 507 score: 0.7540
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 508 score: 0.8238
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 509 score: 0.7615
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 510 score: 0.7531
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 511 score: 0.8581
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 512 score: 0.2668
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 513 score: 0.7963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 514 score: 0.7723
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 515 score: 0.8104
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 516 score: 0.7035
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 517 score: 0.9117
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 518 score: 0.9112
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 519 score: 0.9409
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 520 score: 0.9059
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 521 score: 0.8907
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 522 score: 0.8940
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 523 score: 0.8156
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 524 score: 0.9176
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 525 score: 0.8508
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 526 score: 0.7396
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 527 score: 0.7338
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 528 score: 0.8182
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 529 score: 0.9088
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 530 score: 0.7691
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 531 score: 0.8635
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 532 score: 0.7656
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 533 score: 0.2816
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 534 score: 0.8353
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 535 score: 0.5194
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 536 score: 0.7347
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 537 score: 0.8901
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 538 score: 0.8541
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 539 score: 0.9166
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 540 score: 0.9004
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 541 score: 0.9265
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 542 score: 0.8949
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 543 score: 0.8911
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 544 score: 0.9025
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 545 score: 0.8658
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 546 score: 0.8883
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 547 score: 0.9154
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 548 score: 0.8470
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 549 score: 0.9474
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 550 score: 0.8774
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 551 score: 0.9274
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 552 score: 0.9225
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 553 score: 0.8910
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 554 score: 0.9371
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 555 score: 0.6780
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 556 score: 0.7216
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 557 score: 0.8629
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 558 score: 0.5984
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 559 score: 0.8700
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 560 score: 0.8438
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 561 score: 0.9135
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 562 score: 0.8660
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 563 score: 0.8410
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 564 score: 0.8279
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 565 score: 0.9502
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 566 score: 0.9109
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 567 score: 0.9220
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 568 score: 0.8567
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 569 score: 0.7593
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 570 score: 0.9228
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 571 score: 0.9350
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 572 score: 0.8419
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 573 score: 0.9090
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 574 score: 0.8643
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 575 score: 0.7879
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 576 score: 0.8330
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 577 score: 0.8742
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 578 score: 0.9176
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 579 score: 0.5630
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 580 score: 0.8380
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 581 score: 0.8515
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 582 score: 0.8581
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 583 score: 0.8144
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 584 score: 0.6554
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 585 score: 0.8824
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 586 score: 0.8744
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 587 score: 0.7757
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 588 score: 0.8245
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 589 score: 0.9109
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 590 score: 0.9188
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 591 score: 0.9507
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 592 score: 0.7963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 593 score: 0.9204
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 594 score: 0.9141
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 595 score: 0.8670
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 596 score: 0.8950
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 597 score: 0.7809
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 598 score: 0.8335
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 599 score: 0.9483
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 600 score: 0.8896
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 601 score: 0.7983
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 602 score: 0.8317
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 603 score: 0.8175
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 604 score: 0.9223
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 605 score: 0.9427
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 606 score: 0.8175
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 607 score: 0.6474
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 608 score: 0.7267
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 609 score: 0.8648
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 610 score: 0.9541
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 611 score: 0.8525
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 612 score: 0.9080
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 613 score: 0.8945
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 614 score: 0.9417
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 615 score: 0.8992
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 616 score: 0.9522
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 617 score: 0.9619
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 618 score: 0.9133
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 619 score: 0.8656
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 620 score: 0.8400
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 621 score: 0.8694
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 622 score: 0.9304
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 623 score: 0.8815
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 624 score: 0.8425
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 625 score: 0.9316
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 626 score: 0.9638
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 627 score: 0.9463
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 628 score: 0.8687
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 629 score: 0.8601
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 630 score: 0.8854
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 631 score: 0.9513
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 632 score: 0.9538
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 633 score: 0.9338
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 634 score: 0.9632
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 635 score: 0.9337
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 636 score: 0.9072
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 637 score: 0.8699
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 638 score: 0.8736
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 639 score: 0.9449
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 640 score: 0.9530
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 641 score: 0.9697
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 642 score: 0.8520
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 643 score: 0.6904
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 644 score: 0.3734
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 645 score: 0.7712
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 646 score: 0.8906
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 647 score: 0.8535
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 648 score: 0.1965
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 649 score: 0.8227
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 650 score: 0.8488
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 651 score: 0.8085
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 652 score: 0.3099
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 653 score: 0.2674
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 654 score: 0.8415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 655 score: 0.8839
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 656 score: 0.7699
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 657 score: 0.8997
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 658 score: 0.7646
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 659 score: 0.8673
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 660 score: 0.8421
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 661 score: 0.9407
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 662 score: 0.9193
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 663 score: 0.8511
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 664 score: 0.8795
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 665 score: 0.8542
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 666 score: 0.8379
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 667 score: 0.8121
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 668 score: 0.9342
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 669 score: 0.9190
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 670 score: 0.9199
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 671 score: 0.9309
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 672 score: 0.9013
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 673 score: 0.8871
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 674 score: 0.9511
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 675 score: 0.7943
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 676 score: 0.9020
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 677 score: 0.8671
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 678 score: 0.9126
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 679 score: 0.9482
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 680 score: 0.8766
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 681 score: 0.9307
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 682 score: 0.9403
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 683 score: 0.8930
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 684 score: 0.8634
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 685 score: 0.8642
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 686 score: 0.9079
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 687 score: 0.9095
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 688 score: 0.9385
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 689 score: 0.8528
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 690 score: 0.9049
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 691 score: 0.8735
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 692 score: 0.9178
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 693 score: 0.8317
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 694 score: 0.8652
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 695 score: 0.8855
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 696 score: 0.9469
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 697 score: 0.9196
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 698 score: 0.8504
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 699 score: 0.9566
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 700 score: 0.9008
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 701 score: 0.8630
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 702 score: 0.8912
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 703 score: 0.8880
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 704 score: 0.8406
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 705 score: 0.8463
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 706 score: 0.7914
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 707 score: 0.9121
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 708 score: 0.9278
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 709 score: 0.8985
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 710 score: 0.8827
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 711 score: 0.8483
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 712 score: 0.9477
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 713 score: 0.8808
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 714 score: 0.8794
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 715 score: 0.7870
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 716 score: 0.7245
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 717 score: 0.8602
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 718 score: 0.9120
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 719 score: 0.4351
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 720 score: 0.8737
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 721 score: 0.8332
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 722 score: 0.9403
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 723 score: 0.9162
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 724 score: 0.9445
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 725 score: 0.9499
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 726 score: 0.8886
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 727 score: 0.8816
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 728 score: 0.4320
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 729 score: 0.8825
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 730 score: 0.9017
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 731 score: 0.9156
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 732 score: 0.8747
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 733 score: 0.8595
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 734 score: 0.8364
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 735 score: 0.8950
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 736 score: 0.9252
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 737 score: 0.8770
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 738 score: 0.8839
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 739 score: 0.8909
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 740 score: 0.8790
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 741 score: 0.7081
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 742 score: 0.8676
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 743 score: 0.8594
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 744 score: 0.8298
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 745 score: 0.5304
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 746 score: 0.8853
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 747 score: 0.8970
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 748 score: 0.9493
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 749 score: 0.9231
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 750 score: 0.8917
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 751 score: 0.8946
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 752 score: 0.8696
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 753 score: 0.9078
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 754 score: 0.8901
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 755 score: 0.8984
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 756 score: 0.9120
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 757 score: 0.8868
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 758 score: 0.9034
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 759 score: 0.8644
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 760 score: 0.9322
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 761 score: 0.7534
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 762 score: 0.8413
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 763 score: 0.8518
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 764 score: 0.8560
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 765 score: 0.7582
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 766 score: 0.9275
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 767 score: 0.8792
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 768 score: 0.9436
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 769 score: 0.9668
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 770 score: 0.9215
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 771 score: 0.9076
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 772 score: 0.8318
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 773 score: 0.8984
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 774 score: 0.9192
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 775 score: 0.8607
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 776 score: 0.8464
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 777 score: 0.8736
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 778 score: 0.8436
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 779 score: 0.8675
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 780 score: 0.6862
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 781 score: 0.2197
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 782 score: 0.8828
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 783 score: 0.7427
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 784 score: 0.9151
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 785 score: 0.7551
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 786 score: 0.9055
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 787 score: 0.8609
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 788 score: 0.8630
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 789 score: 0.8984
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 790 score: 0.8452
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 791 score: 0.8055
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 792 score: 0.9131
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 793 score: 0.8455
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 794 score: 0.7296
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 795 score: 0.8674
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 796 score: 0.9590
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 797 score: 0.8014
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 798 score: 0.9089
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 799 score: 0.9134
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 800 score: 0.8415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 801 score: 0.9027
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 802 score: 0.8644
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 803 score: 0.8564
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 804 score: 0.6326
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 805 score: 0.7909
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 806 score: 0.8376
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 807 score: 0.9153
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 808 score: 0.8722
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 809 score: 0.8859
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 810 score: 0.6543
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 811 score: 0.6919
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 812 score: 0.9357
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 813 score: 0.8748
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 814 score: 0.7975
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 815 score: 0.7430
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 816 score: 0.9035
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 817 score: 0.3280
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 818 score: 0.4807
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 819 score: 0.8132
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 820 score: 0.9243
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 821 score: 0.9249
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 822 score: 0.8673
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 823 score: 0.8644
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 824 score: 0.9081
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 825 score: 0.9118
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 826 score: 0.9352
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 827 score: 0.8944
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 828 score: 0.8965
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 829 score: 0.8030
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 830 score: 0.9047
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 831 score: 0.7939
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 832 score: 0.8702
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 833 score: 0.6952
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 834 score: 0.1910
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 835 score: 0.8057
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 836 score: 0.7129
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 837 score: 0.6576
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 838 score: 0.8559
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 839 score: 0.8533
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 840 score: 0.8770
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 841 score: 0.8344
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 842 score: 0.3831
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 843 score: 0.8951
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 844 score: 0.6916
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 845 score: 0.6365
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 846 score: 0.6871
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 847 score: 0.8496
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 848 score: 0.7272
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 849 score: 0.8310
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 850 score: 0.8103
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 851 score: 0.8923
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 852 score: 0.9214
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 853 score: 0.9335
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 854 score: 0.8125
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 855 score: 0.8960
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 856 score: 0.7898
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 857 score: 0.9392
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 858 score: 0.7210
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 859 score: 0.9076
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 860 score: 0.9276
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 861 score: 0.9199
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 862 score: 0.8040
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 863 score: 0.7662
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 864 score: 0.8927
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 865 score: 0.8361
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 866 score: 0.8944
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 867 score: 0.8041
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 868 score: 0.9435
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 869 score: 0.8605
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 870 score: 0.9224
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 871 score: 0.9332
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 872 score: 0.8715
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 873 score: 0.8799
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 874 score: 0.9253
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 875 score: 0.8307
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 876 score: 0.9099
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 877 score: 0.6873
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 878 score: 0.9196
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 879 score: 0.8892
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 880 score: 0.8862
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 881 score: 0.2838
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 882 score: 0.9396
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 883 score: 0.9202
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 884 score: 0.8275
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 885 score: 0.8952
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 886 score: 0.8682
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 887 score: 0.8301
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 888 score: 0.7455
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 889 score: 0.8278
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 890 score: 0.8111
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 891 score: 0.7842
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 892 score: 0.2333
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 893 score: 0.9126
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 894 score: 0.8062
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 895 score: 0.9001
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 896 score: 0.9249
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 897 score: 0.8838
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 898 score: 0.9271
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 899 score: 0.8940
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 900 score: 0.9203
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 901 score: 0.9004
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 902 score: 0.7166
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 903 score: 0.8760
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 904 score: 0.9036
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 905 score: 0.8918
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 906 score: 0.9219
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 907 score: 0.8244
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 908 score: 0.8680
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 909 score: 0.9093
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 910 score: 0.8704
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 911 score: 0.7924
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 912 score: 0.9023
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 913 score: 0.8471
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 914 score: 0.8721
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 915 score: 0.8668
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 916 score: 0.9008
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 917 score: 0.8444
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 918 score: 0.9218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 919 score: 0.8299
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 920 score: 0.8173
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 921 score: 0.8188
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 922 score: 0.9068
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 923 score: 0.3417
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 924 score: 0.9185
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 925 score: 0.8804
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 926 score: 0.8603
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 927 score: 0.8433
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 928 score: 0.9099
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 929 score: 0.8843
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 930 score: 0.8743
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 931 score: 0.7817
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 932 score: 0.7926
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 933 score: 0.7723
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 934 score: 0.8119
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 935 score: 0.8449
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 936 score: 0.7527
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 937 score: 0.9484
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 938 score: 0.9524
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 939 score: 0.8527
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 940 score: 0.9246
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 941 score: 0.9485
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 942 score: 0.9454
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 943 score: 0.9178
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 944 score: 0.7985
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 945 score: 0.8990
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 946 score: 0.8016
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 947 score: 0.9098
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 948 score: 0.8870
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 949 score: 0.9287
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 950 score: 0.8834
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 951 score: 0.7767
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 952 score: 0.8499
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 953 score: 0.8464
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 954 score: 0.8014
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 955 score: 0.9226
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 956 score: 0.9094
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 957 score: 0.9654
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 958 score: 0.8802
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 959 score: 0.8905
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 960 score: 0.8121
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 961 score: 0.7538
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 962 score: 0.8693
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 963 score: 0.8089
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 964 score: 0.9340
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 965 score: 0.7964
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 966 score: 0.8874
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 967 score: 0.7641
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 968 score: 0.7709
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 969 score: 0.7971
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 970 score: 0.9091
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 971 score: 0.2698
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 972 score: 0.7336
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 973 score: 0.8998
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 974 score: 0.8900
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 975 score: 0.9134
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 976 score: 0.8878
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 977 score: 0.8946
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 978 score: 0.9303
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 979 score: 0.9126
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 980 score: 0.8275
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 981 score: 0.9160
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 982 score: 0.9167
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 983 score: 0.8546
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 984 score: 0.9067
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 985 score: 0.9007
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 986 score: 0.8538
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 987 score: 0.8857
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 988 score: 0.7932
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 989 score: 0.7692
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 990 score: 0.9499
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 991 score: 0.5385
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 992 score: 0.8878
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 993 score: 0.8714
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 994 score: 0.8870
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 995 score: 0.8791
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 996 score: 0.8746
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 997 score: 0.9587
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 998 score: 0.8405
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 999 score: 0.7963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1000 score: 0.9085
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1001 score: 0.4256
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1002 score: 0.8531
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1003 score: 0.8822
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1004 score: 0.9027
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1005 score: 0.9254
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1006 score: 0.9012
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1007 score: 0.8820
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1008 score: 0.4178
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1009 score: 0.8832
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1010 score: 0.8981
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko Segment 1011 score: 0.8715
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/group_training/alma-13b-sft-group-6-max-tokens-512//test-en-ko score: 0.8444