diff --git "a/test-en-vi.comet" "b/test-en-vi.comet" new file mode 100644--- /dev/null +++ "b/test-en-vi.comet" @@ -0,0 +1,1013 @@ +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 0 score: 0.8681 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1 score: 0.9029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 2 score: 0.8980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 3 score: 0.8467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 4 score: 0.8498 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 5 score: 0.6467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 6 score: 0.8603 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 7 score: 0.8855 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 8 score: 0.9715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 9 score: 0.8972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 10 score: 0.9220 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 11 score: 0.8713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 12 score: 0.8846 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 13 score: 0.8926 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 14 score: 0.8767 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 15 score: 0.7438 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 16 score: 0.8691 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 17 score: 0.9336 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 18 score: 0.9055 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 19 score: 0.8996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 20 score: 0.9519 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 21 score: 0.9442 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 22 score: 0.8221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 23 score: 0.8734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 24 score: 0.9246 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 25 score: 0.9128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 26 score: 0.8036 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 27 score: 0.7699 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 28 score: 0.8751 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 29 score: 0.9180 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 30 score: 0.7876 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 31 score: 0.7279 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 32 score: 0.8419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 33 score: 0.9231 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 34 score: 0.8847 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 35 score: 0.9483 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 36 score: 0.8914 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 37 score: 0.8481 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 38 score: 0.8401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 39 score: 0.9138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 40 score: 0.8750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 41 score: 0.9479 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 42 score: 0.7994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 43 score: 0.9202 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 44 score: 0.8405 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 45 score: 0.9124 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 46 score: 0.8804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 47 score: 0.8992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 48 score: 0.8952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 49 score: 0.8059 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 50 score: 0.9163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 51 score: 0.9019 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 52 score: 0.9218 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 53 score: 0.9408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 54 score: 0.9082 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 55 score: 0.8964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 56 score: 0.9051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 57 score: 0.8478 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 58 score: 0.8592 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 59 score: 0.9586 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 60 score: 0.8782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 61 score: 0.9427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 62 score: 0.9002 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 63 score: 0.9181 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 64 score: 0.8851 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 65 score: 0.7310 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 66 score: 0.7363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 67 score: 0.6353 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 68 score: 0.9448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 69 score: 0.9169 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 70 score: 0.8697 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 71 score: 0.8597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 72 score: 0.8702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 73 score: 0.8174 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 74 score: 0.9053 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 75 score: 0.8667 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 76 score: 0.9098 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 77 score: 0.9228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 78 score: 0.9339 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 79 score: 0.9017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 80 score: 0.8477 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 81 score: 0.9206 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 82 score: 0.8651 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 83 score: 0.7120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 84 score: 0.8862 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 85 score: 0.8760 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 86 score: 0.8267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 87 score: 0.8879 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 88 score: 0.8943 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 89 score: 0.8267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 90 score: 0.8433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 91 score: 0.8689 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 92 score: 0.8250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 93 score: 0.9516 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 94 score: 0.9328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 95 score: 0.9163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 96 score: 0.9127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 97 score: 0.9186 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 98 score: 0.9294 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 99 score: 0.8505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 100 score: 0.9159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 101 score: 0.8756 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 102 score: 0.8733 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 103 score: 0.8988 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 104 score: 0.9157 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 105 score: 0.8956 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 106 score: 0.9369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 107 score: 0.8062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 108 score: 0.6440 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 109 score: 0.7740 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 110 score: 0.8192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 111 score: 0.9086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 112 score: 0.9451 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 113 score: 0.9206 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 114 score: 0.8717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 115 score: 0.8484 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 116 score: 0.8799 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 117 score: 0.8934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 118 score: 0.9727 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 119 score: 0.8103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 120 score: 0.7941 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 121 score: 0.9147 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 122 score: 0.9462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 123 score: 0.9344 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 124 score: 0.9459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 125 score: 0.9035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 126 score: 0.9186 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 127 score: 0.9088 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 128 score: 0.8912 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 129 score: 0.9385 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 130 score: 0.9147 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 131 score: 0.8392 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 132 score: 0.8955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 133 score: 0.9241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 134 score: 0.7644 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 135 score: 0.1836 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 136 score: 0.9301 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 137 score: 0.7779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 138 score: 0.8834 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 139 score: 0.8864 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 140 score: 0.9244 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 141 score: 0.8946 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 142 score: 0.9413 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 143 score: 0.9213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 144 score: 0.9436 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 145 score: 0.9237 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 146 score: 0.9320 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 147 score: 0.9265 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 148 score: 0.9206 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 149 score: 0.9403 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 150 score: 0.9203 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 151 score: 0.8750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 152 score: 0.8130 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 153 score: 0.8873 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 154 score: 0.7806 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 155 score: 0.8780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 156 score: 0.8901 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 157 score: 0.7877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 158 score: 0.9151 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 159 score: 0.9145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 160 score: 0.8709 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 161 score: 0.7750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 162 score: 0.8353 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 163 score: 0.9096 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 164 score: 0.8858 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 165 score: 0.7789 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 166 score: 0.9331 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 167 score: 0.9079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 168 score: 0.8861 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 169 score: 0.8834 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 170 score: 0.8739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 171 score: 0.9118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 172 score: 0.9436 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 173 score: 0.8054 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 174 score: 0.9265 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 175 score: 0.9435 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 176 score: 0.8459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 177 score: 0.9107 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 178 score: 0.7581 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 179 score: 0.9222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 180 score: 0.8183 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 181 score: 0.8881 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 182 score: 0.8877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 183 score: 0.9118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 184 score: 0.2641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 185 score: 0.9519 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 186 score: 0.9369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 187 score: 0.8029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 188 score: 0.8688 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 189 score: 0.8141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 190 score: 0.7501 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 191 score: 0.8939 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 192 score: 0.8980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 193 score: 0.8740 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 194 score: 0.8698 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 195 score: 0.8908 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 196 score: 0.8068 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 197 score: 0.8109 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 198 score: 0.9116 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 199 score: 0.8213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 200 score: 0.7891 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 201 score: 0.7942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 202 score: 0.7992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 203 score: 0.8323 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 204 score: 0.8495 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 205 score: 0.8693 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 206 score: 0.9047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 207 score: 0.8694 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 208 score: 0.9005 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 209 score: 0.9276 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 210 score: 0.9406 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 211 score: 0.9010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 212 score: 0.9025 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 213 score: 0.9323 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 214 score: 0.9266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 215 score: 0.9272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 216 score: 0.9167 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 217 score: 0.9371 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 218 score: 0.9411 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 219 score: 0.8846 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 220 score: 0.9602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 221 score: 0.9171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 222 score: 0.9240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 223 score: 0.9154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 224 score: 0.9448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 225 score: 0.9213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 226 score: 0.9354 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 227 score: 0.8306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 228 score: 0.8216 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 229 score: 0.8948 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 230 score: 0.9742 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 231 score: 0.8825 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 232 score: 0.8713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 233 score: 0.8143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 234 score: 0.8379 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 235 score: 0.8660 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 236 score: 0.9138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 237 score: 0.8612 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 238 score: 0.9260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 239 score: 0.9474 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 240 score: 0.8015 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 241 score: 0.7131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 242 score: 0.8770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 243 score: 0.7654 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 244 score: 0.7922 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 245 score: 0.8289 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 246 score: 0.7849 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 247 score: 0.7221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 248 score: 0.8345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 249 score: 0.9577 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 250 score: 0.8923 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 251 score: 0.9445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 252 score: 0.9317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 253 score: 0.9348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 254 score: 0.9312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 255 score: 0.9400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 256 score: 0.8331 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 257 score: 0.9254 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 258 score: 0.9159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 259 score: 0.8472 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 260 score: 0.9381 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 261 score: 0.8570 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 262 score: 0.9238 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 263 score: 0.6572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 264 score: 0.9215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 265 score: 0.8979 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 266 score: 0.8512 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 267 score: 0.8606 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 268 score: 0.9328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 269 score: 0.8848 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 270 score: 0.8288 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 271 score: 0.8386 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 272 score: 0.8902 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 273 score: 0.8343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 274 score: 0.8086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 275 score: 0.7899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 276 score: 0.7822 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 277 score: 0.8892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 278 score: 0.9032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 279 score: 0.9268 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 280 score: 0.9200 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 281 score: 0.9597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 282 score: 0.8088 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 283 score: 0.8717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 284 score: 0.9282 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 285 score: 0.9554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 286 score: 0.8986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 287 score: 0.9049 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 288 score: 0.8461 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 289 score: 0.9127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 290 score: 0.8828 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 291 score: 0.8746 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 292 score: 0.9149 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 293 score: 0.9232 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 294 score: 0.7770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 295 score: 0.6961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 296 score: 0.8643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 297 score: 0.8858 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 298 score: 0.6548 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 299 score: 0.8539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 300 score: 0.9005 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 301 score: 0.8620 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 302 score: 0.8602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 303 score: 0.9614 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 304 score: 0.8919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 305 score: 0.8482 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 306 score: 0.9359 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 307 score: 0.8861 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 308 score: 0.9119 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 309 score: 0.9352 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 310 score: 0.9117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 311 score: 0.9053 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 312 score: 0.8703 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 313 score: 0.7478 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 314 score: 0.9211 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 315 score: 0.9283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 316 score: 0.8779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 317 score: 0.8537 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 318 score: 0.8457 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 319 score: 0.7478 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 320 score: 0.8341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 321 score: 0.8060 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 322 score: 0.9173 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 323 score: 0.9266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 324 score: 0.9404 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 325 score: 0.9130 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 326 score: 0.7331 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 327 score: 0.8121 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 328 score: 0.9101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 329 score: 0.9125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 330 score: 0.9119 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 331 score: 0.8847 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 332 score: 0.9022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 333 score: 0.7709 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 334 score: 0.9543 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 335 score: 0.9157 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 336 score: 0.8875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 337 score: 0.8393 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 338 score: 0.8271 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 339 score: 0.9262 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 340 score: 0.7975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 341 score: 0.8897 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 342 score: 0.6517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 343 score: 0.7711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 344 score: 0.8610 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 345 score: 0.8713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 346 score: 0.9426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 347 score: 0.8844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 348 score: 0.8047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 349 score: 0.8341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 350 score: 0.8101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 351 score: 0.8873 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 352 score: 0.8551 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 353 score: 0.9069 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 354 score: 0.9255 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 355 score: 0.8851 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 356 score: 0.9158 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 357 score: 0.8996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 358 score: 0.9467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 359 score: 0.7089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 360 score: 0.8738 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 361 score: 0.8827 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 362 score: 0.9004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 363 score: 0.8752 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 364 score: 0.8768 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 365 score: 0.8662 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 366 score: 0.8016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 367 score: 0.7869 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 368 score: 0.4525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 369 score: 0.8298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 370 score: 0.7489 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 371 score: 0.7420 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 372 score: 0.8637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 373 score: 0.8903 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 374 score: 0.8725 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 375 score: 0.8054 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 376 score: 0.9328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 377 score: 0.9227 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 378 score: 0.7409 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 379 score: 0.8866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 380 score: 0.9395 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 381 score: 0.8027 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 382 score: 0.7661 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 383 score: 0.8267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 384 score: 0.8685 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 385 score: 0.8214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 386 score: 0.7361 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 387 score: 0.8990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 388 score: 0.7938 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 389 score: 0.9186 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 390 score: 0.8653 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 391 score: 0.9083 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 392 score: 0.7586 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 393 score: 0.8944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 394 score: 0.8775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 395 score: 0.8907 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 396 score: 0.7159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 397 score: 0.9478 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 398 score: 0.7922 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 399 score: 0.9140 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 400 score: 0.9380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 401 score: 0.8082 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 402 score: 0.9445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 403 score: 0.7864 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 404 score: 0.8095 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 405 score: 0.7641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 406 score: 0.9065 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 407 score: 0.9258 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 408 score: 0.9284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 409 score: 0.9126 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 410 score: 0.9285 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 411 score: 0.8657 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 412 score: 0.7749 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 413 score: 0.8996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 414 score: 0.8705 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 415 score: 0.8843 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 416 score: 0.9128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 417 score: 0.8513 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 418 score: 0.9351 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 419 score: 0.8909 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 420 score: 0.9147 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 421 score: 0.9524 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 422 score: 0.9032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 423 score: 0.8973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 424 score: 0.8399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 425 score: 0.9318 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 426 score: 0.9171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 427 score: 0.8916 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 428 score: 0.9098 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 429 score: 0.9259 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 430 score: 0.9081 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 431 score: 0.8650 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 432 score: 0.7566 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 433 score: 0.8605 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 434 score: 0.7232 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 435 score: 0.7486 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 436 score: 0.8974 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 437 score: 0.8448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 438 score: 0.9375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 439 score: 0.8852 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 440 score: 0.9142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 441 score: 0.8947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 442 score: 0.8976 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 443 score: 0.9128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 444 score: 0.7497 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 445 score: 0.8225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 446 score: 0.8647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 447 score: 0.9205 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 448 score: 0.9592 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 449 score: 0.8338 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 450 score: 0.9148 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 451 score: 0.9003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 452 score: 0.9290 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 453 score: 0.9140 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 454 score: 0.9078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 455 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 456 score: 0.7279 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 457 score: 0.9178 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 458 score: 0.9105 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 459 score: 0.8132 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 460 score: 0.9512 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 461 score: 0.8670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 462 score: 0.7131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 463 score: 0.9123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 464 score: 0.8859 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 465 score: 0.7370 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 466 score: 0.8719 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 467 score: 0.7241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 468 score: 0.7066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 469 score: 0.3000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 470 score: 0.7704 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 471 score: 0.8487 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 472 score: 0.8777 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 473 score: 0.8938 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 474 score: 0.8133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 475 score: 0.8789 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 476 score: 0.8817 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 477 score: 0.8401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 478 score: 0.8525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 479 score: 0.9348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 480 score: 0.7399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 481 score: 0.7838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 482 score: 0.8123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 483 score: 0.8185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 484 score: 0.9232 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 485 score: 0.8761 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 486 score: 0.8850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 487 score: 0.8248 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 488 score: 0.9303 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 489 score: 0.8317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 490 score: 0.8439 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 491 score: 0.9273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 492 score: 0.9674 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 493 score: 0.9193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 494 score: 0.8407 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 495 score: 0.5257 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 496 score: 0.9073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 497 score: 0.7558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 498 score: 0.8818 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 499 score: 0.7978 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 500 score: 0.9227 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 501 score: 0.9277 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 502 score: 0.8635 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 503 score: 0.8308 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 504 score: 0.7705 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 505 score: 0.8906 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 506 score: 0.8730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 507 score: 0.9090 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 508 score: 0.8218 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 509 score: 0.8273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 510 score: 0.5915 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 511 score: 0.7972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 512 score: 0.8107 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 513 score: 0.8784 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 514 score: 0.9110 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 515 score: 0.8982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 516 score: 0.7047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 517 score: 0.8940 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 518 score: 0.8192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 519 score: 0.9314 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 520 score: 0.8872 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 521 score: 0.8117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 522 score: 0.8750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 523 score: 0.8178 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 524 score: 0.8165 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 525 score: 0.8323 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 526 score: 0.7913 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 527 score: 0.8256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 528 score: 0.8155 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 529 score: 0.8985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 530 score: 0.8317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 531 score: 0.8842 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 532 score: 0.7961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 533 score: 0.7882 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 534 score: 0.8522 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 535 score: 0.8052 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 536 score: 0.8650 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 537 score: 0.8190 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 538 score: 0.8958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 539 score: 0.8973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 540 score: 0.8927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 541 score: 0.9421 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 542 score: 0.8722 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 543 score: 0.8561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 544 score: 0.8957 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 545 score: 0.9181 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 546 score: 0.8840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 547 score: 0.9165 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 548 score: 0.8885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 549 score: 0.9235 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 550 score: 0.8975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 551 score: 0.9039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 552 score: 0.8927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 553 score: 0.9031 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 554 score: 0.8986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 555 score: 0.7445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 556 score: 0.8194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 557 score: 0.8888 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 558 score: 0.7886 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 559 score: 0.7796 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 560 score: 0.8424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 561 score: 0.9145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 562 score: 0.9002 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 563 score: 0.7507 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 564 score: 0.9003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 565 score: 0.9307 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 566 score: 0.8280 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 567 score: 0.8999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 568 score: 0.8826 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 569 score: 0.6328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 570 score: 0.8780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 571 score: 0.9113 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 572 score: 0.8196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 573 score: 0.9424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 574 score: 0.8885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 575 score: 0.8439 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 576 score: 0.8718 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 577 score: 0.9008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 578 score: 0.8560 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 579 score: 0.8449 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 580 score: 0.8187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 581 score: 0.8643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 582 score: 0.8673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 583 score: 0.8694 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 584 score: 0.6603 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 585 score: 0.7056 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 586 score: 0.8643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 587 score: 0.8680 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 588 score: 0.8591 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 589 score: 0.9144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 590 score: 0.8743 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 591 score: 0.9363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 592 score: 0.8086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 593 score: 0.9013 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 594 score: 0.8758 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 595 score: 0.8892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 596 score: 0.7792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 597 score: 0.8558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 598 score: 0.8185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 599 score: 0.9047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 600 score: 0.8275 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 601 score: 0.8084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 602 score: 0.8814 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 603 score: 0.8855 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 604 score: 0.9020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 605 score: 0.9429 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 606 score: 0.8847 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 607 score: 0.8376 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 608 score: 0.7266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 609 score: 0.8911 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 610 score: 0.9207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 611 score: 0.9459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 612 score: 0.8551 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 613 score: 0.8765 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 614 score: 0.9197 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 615 score: 0.7461 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 616 score: 0.8643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 617 score: 0.9528 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 618 score: 0.9365 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 619 score: 0.9042 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 620 score: 0.8768 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 621 score: 0.6381 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 622 score: 0.9165 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 623 score: 0.9357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 624 score: 0.8336 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 625 score: 0.9172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 626 score: 0.9343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 627 score: 0.8942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 628 score: 0.9537 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 629 score: 0.8984 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 630 score: 0.7965 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 631 score: 0.9474 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 632 score: 0.9629 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 633 score: 0.9367 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 634 score: 0.9634 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 635 score: 0.9220 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 636 score: 0.9104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 637 score: 0.9217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 638 score: 0.8370 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 639 score: 0.9405 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 640 score: 0.8805 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 641 score: 0.9358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 642 score: 0.8527 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 643 score: 0.6978 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 644 score: 0.5827 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 645 score: 0.7982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 646 score: 0.7191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 647 score: 0.8753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 648 score: 0.8196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 649 score: 0.8170 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 650 score: 0.9549 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 651 score: 0.7939 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 652 score: 0.7734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 653 score: 0.8072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 654 score: 0.9365 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 655 score: 0.8476 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 656 score: 0.8648 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 657 score: 0.8900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 658 score: 0.6969 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 659 score: 0.8409 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 660 score: 0.7803 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 661 score: 0.8967 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 662 score: 0.8914 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 663 score: 0.8045 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 664 score: 0.8744 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 665 score: 0.8373 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 666 score: 0.8763 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 667 score: 0.8409 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 668 score: 0.8532 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 669 score: 0.8486 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 670 score: 0.8937 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 671 score: 0.9343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 672 score: 0.9104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 673 score: 0.8996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 674 score: 0.8011 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 675 score: 0.8627 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 676 score: 0.8854 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 677 score: 0.8850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 678 score: 0.8348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 679 score: 0.9072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 680 score: 0.8990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 681 score: 0.9045 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 682 score: 0.9017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 683 score: 0.8731 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 684 score: 0.8953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 685 score: 0.8715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 686 score: 0.8874 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 687 score: 0.8277 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 688 score: 0.8711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 689 score: 0.8540 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 690 score: 0.9410 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 691 score: 0.8767 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 692 score: 0.8340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 693 score: 0.8920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 694 score: 0.8278 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 695 score: 0.8321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 696 score: 0.9111 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 697 score: 0.9257 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 698 score: 0.8738 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 699 score: 0.9519 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 700 score: 0.9210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 701 score: 0.9176 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 702 score: 0.8900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 703 score: 0.8894 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 704 score: 0.7422 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 705 score: 0.7811 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 706 score: 0.7367 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 707 score: 0.8963 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 708 score: 0.9322 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 709 score: 0.8785 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 710 score: 0.8841 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 711 score: 0.8147 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 712 score: 0.9359 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 713 score: 0.8823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 714 score: 0.8548 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 715 score: 0.8611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 716 score: 0.8948 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 717 score: 0.8920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 718 score: 0.9341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 719 score: 0.9079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 720 score: 0.9286 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 721 score: 0.9140 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 722 score: 0.9327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 723 score: 0.8971 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 724 score: 0.9024 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 725 score: 0.8836 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 726 score: 0.8475 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 727 score: 0.9061 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 728 score: 0.7360 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 729 score: 0.8865 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 730 score: 0.8670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 731 score: 0.9339 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 732 score: 0.8850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 733 score: 0.9384 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 734 score: 0.8795 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 735 score: 0.9181 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 736 score: 0.9169 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 737 score: 0.8843 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 738 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 739 score: 0.8729 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 740 score: 0.8984 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 741 score: 0.8648 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 742 score: 0.8973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 743 score: 0.9406 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 744 score: 0.9297 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 745 score: 0.8745 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 746 score: 0.9047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 747 score: 0.8797 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 748 score: 0.9322 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 749 score: 0.9251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 750 score: 0.8991 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 751 score: 0.9069 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 752 score: 0.9223 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 753 score: 0.8597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 754 score: 0.9412 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 755 score: 0.8795 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 756 score: 0.8820 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 757 score: 0.9049 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 758 score: 0.7726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 759 score: 0.8427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 760 score: 0.9573 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 761 score: 0.8954 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 762 score: 0.9456 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 763 score: 0.8959 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 764 score: 0.8957 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 765 score: 0.8730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 766 score: 0.8823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 767 score: 0.8860 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 768 score: 0.9484 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 769 score: 0.9498 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 770 score: 0.9273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 771 score: 0.9487 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 772 score: 0.9062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 773 score: 0.9399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 774 score: 0.9405 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 775 score: 0.7971 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 776 score: 0.8783 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 777 score: 0.8219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 778 score: 0.8447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 779 score: 0.8103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 780 score: 0.6874 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 781 score: 0.6520 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 782 score: 0.8322 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 783 score: 0.8866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 784 score: 0.8858 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 785 score: 0.6980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 786 score: 0.9304 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 787 score: 0.9374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 788 score: 0.9130 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 789 score: 0.8595 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 790 score: 0.9171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 791 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 792 score: 0.8983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 793 score: 0.9192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 794 score: 0.8861 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 795 score: 0.9173 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 796 score: 0.9387 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 797 score: 0.7908 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 798 score: 0.8744 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 799 score: 0.7387 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 800 score: 0.9160 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 801 score: 0.8421 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 802 score: 0.8973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 803 score: 0.8540 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 804 score: 0.8900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 805 score: 0.9142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 806 score: 0.9020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 807 score: 0.8862 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 808 score: 0.8877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 809 score: 0.8132 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 810 score: 0.6374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 811 score: 0.7931 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 812 score: 0.9262 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 813 score: 0.8606 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 814 score: 0.8862 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 815 score: 0.6990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 816 score: 0.9148 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 817 score: 0.7375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 818 score: 0.6179 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 819 score: 0.8766 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 820 score: 0.8666 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 821 score: 0.8955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 822 score: 0.8905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 823 score: 0.8490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 824 score: 0.9310 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 825 score: 0.8825 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 826 score: 0.8848 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 827 score: 0.9114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 828 score: 0.8732 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 829 score: 0.7959 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 830 score: 0.8451 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 831 score: 0.8455 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 832 score: 0.9117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 833 score: 0.7718 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 834 score: 0.7926 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 835 score: 0.7597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 836 score: 0.9035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 837 score: 0.8333 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 838 score: 0.8009 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 839 score: 0.8306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 840 score: 0.8731 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 841 score: 0.8616 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 842 score: 0.6815 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 843 score: 0.9104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 844 score: 0.8549 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 845 score: 0.6773 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 846 score: 0.6789 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 847 score: 0.8631 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 848 score: 0.7985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 849 score: 0.8213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 850 score: 0.7526 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 851 score: 0.9424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 852 score: 0.9197 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 853 score: 0.9224 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 854 score: 0.7447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 855 score: 0.8393 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 856 score: 0.8188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 857 score: 0.9349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 858 score: 0.7452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 859 score: 0.9292 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 860 score: 0.9085 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 861 score: 0.8477 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 862 score: 0.9110 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 863 score: 0.8762 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 864 score: 0.8899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 865 score: 0.8824 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 866 score: 0.9099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 867 score: 0.8375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 868 score: 0.9187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 869 score: 0.9457 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 870 score: 0.9593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 871 score: 0.9202 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 872 score: 0.8702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 873 score: 0.9293 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 874 score: 0.9230 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 875 score: 0.8010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 876 score: 0.8185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 877 score: 0.9115 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 878 score: 0.8131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 879 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 880 score: 0.8969 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 881 score: 0.9015 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 882 score: 0.8656 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 883 score: 0.9049 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 884 score: 0.8244 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 885 score: 0.9123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 886 score: 0.8981 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 887 score: 0.8117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 888 score: 0.7003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 889 score: 0.8728 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 890 score: 0.8632 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 891 score: 0.8861 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 892 score: 0.6517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 893 score: 0.7169 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 894 score: 0.8912 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 895 score: 0.9413 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 896 score: 0.8937 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 897 score: 0.8596 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 898 score: 0.8419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 899 score: 0.9062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 900 score: 0.9052 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 901 score: 0.8338 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 902 score: 0.7564 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 903 score: 0.9006 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 904 score: 0.8891 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 905 score: 0.8161 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 906 score: 0.9258 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 907 score: 0.8863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 908 score: 0.8873 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 909 score: 0.9481 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 910 score: 0.6783 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 911 score: 0.7748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 912 score: 0.9553 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 913 score: 0.9025 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 914 score: 0.9026 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 915 score: 0.8857 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 916 score: 0.9073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 917 score: 0.8553 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 918 score: 0.8938 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 919 score: 0.9066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 920 score: 0.8726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 921 score: 0.8760 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 922 score: 0.8346 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 923 score: 0.8931 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 924 score: 0.8975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 925 score: 0.8995 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 926 score: 0.8835 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 927 score: 0.8361 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 928 score: 0.8532 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 929 score: 0.8794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 930 score: 0.8841 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 931 score: 0.8650 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 932 score: 0.7685 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 933 score: 0.8823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 934 score: 0.8284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 935 score: 0.8291 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 936 score: 0.8526 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 937 score: 0.9734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 938 score: 0.9447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 939 score: 0.9432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 940 score: 0.9420 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 941 score: 0.9702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 942 score: 0.9348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 943 score: 0.9004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 944 score: 0.8485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 945 score: 0.8741 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 946 score: 0.8850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 947 score: 0.8105 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 948 score: 0.8356 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 949 score: 0.9420 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 950 score: 0.8378 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 951 score: 0.8919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 952 score: 0.7985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 953 score: 0.8920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 954 score: 0.8341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 955 score: 0.9163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 956 score: 0.8855 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 957 score: 0.9459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 958 score: 0.8712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 959 score: 0.7935 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 960 score: 0.8380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 961 score: 0.6354 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 962 score: 0.8588 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 963 score: 0.8295 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 964 score: 0.9550 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 965 score: 0.8871 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 966 score: 0.8759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 967 score: 0.8526 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 968 score: 0.7988 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 969 score: 0.7066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 970 score: 0.8759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 971 score: 0.8027 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 972 score: 0.7964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 973 score: 0.8945 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 974 score: 0.8460 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 975 score: 0.9183 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 976 score: 0.8858 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 977 score: 0.8335 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 978 score: 0.8757 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 979 score: 0.9146 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 980 score: 0.7740 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 981 score: 0.9261 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 982 score: 0.8193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 983 score: 0.8770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 984 score: 0.8408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 985 score: 0.9119 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 986 score: 0.8035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 987 score: 0.7149 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 988 score: 0.7001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 989 score: 0.8297 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 990 score: 0.9315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 991 score: 0.8300 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 992 score: 0.9174 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 993 score: 0.8866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 994 score: 0.8033 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 995 score: 0.9039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 996 score: 0.9188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 997 score: 0.9266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 998 score: 0.8356 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 999 score: 0.8431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1000 score: 0.8194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1001 score: 0.8103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1002 score: 0.8676 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1003 score: 0.8636 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1004 score: 0.9251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1005 score: 0.8861 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1006 score: 0.8816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1007 score: 0.9016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1008 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1009 score: 0.8141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1010 score: 0.9423 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi Segment 1011 score: 0.8593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-vi-max-tokens-512//test-en-vi score: 0.8649