diff --git "a/test-en-th.comet" "b/test-en-th.comet" new file mode 100644--- /dev/null +++ "b/test-en-th.comet" @@ -0,0 +1,1013 @@ +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 0 score: 0.6353 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1 score: 0.3283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 2 score: 0.8375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 3 score: 0.6063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 4 score: 0.7918 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 5 score: 0.3093 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 6 score: 0.7073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 7 score: 0.7575 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 8 score: 0.7602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 9 score: 0.7100 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 10 score: 0.6010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 11 score: 0.6250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 12 score: 0.5853 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 13 score: 0.8843 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 14 score: 0.7461 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 15 score: 0.3103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 16 score: 0.7701 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 17 score: 0.7381 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 18 score: 0.8792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 19 score: 0.4600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 20 score: 0.6407 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 21 score: 0.6099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 22 score: 0.5089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 23 score: 0.7679 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 24 score: 0.8081 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 25 score: 0.6827 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 26 score: 0.7313 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 27 score: 0.3902 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 28 score: 0.5643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 29 score: 0.7712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 30 score: 0.5727 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 31 score: 0.4288 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 32 score: 0.6357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 33 score: 0.5162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 34 score: 0.8972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 35 score: 0.9219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 36 score: 0.5127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 37 score: 0.6802 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 38 score: 0.2617 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 39 score: 0.8562 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 40 score: 0.4720 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 41 score: 0.7866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 42 score: 0.5120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 43 score: 0.8173 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 44 score: 0.5847 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 45 score: 0.6866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 46 score: 0.1885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 47 score: 0.7578 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 48 score: 0.3399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 49 score: 0.7067 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 50 score: 0.8346 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 51 score: 0.7851 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 52 score: 0.6071 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 53 score: 0.3033 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 54 score: 0.5505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 55 score: 0.6533 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 56 score: 0.3394 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 57 score: 0.3775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 58 score: 0.5530 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 59 score: 0.9343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 60 score: 0.7256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 61 score: 0.7900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 62 score: 0.6446 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 63 score: 0.5347 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 64 score: 0.6103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 65 score: 0.7408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 66 score: 0.6518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 67 score: 0.6131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 68 score: 0.8585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 69 score: 0.7208 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 70 score: 0.3095 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 71 score: 0.6323 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 72 score: 0.4104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 73 score: 0.2141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 74 score: 0.7930 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 75 score: 0.7294 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 76 score: 0.5763 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 77 score: 0.8520 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 78 score: 0.8816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 79 score: 0.7346 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 80 score: 0.1501 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 81 score: 0.7714 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 82 score: 0.5842 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 83 score: 0.3569 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 84 score: 0.7358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 85 score: 0.7486 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 86 score: 0.4660 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 87 score: 0.3412 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 88 score: 0.7451 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 89 score: 0.4920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 90 score: 0.3983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 91 score: 0.3266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 92 score: 0.3021 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 93 score: 0.8193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 94 score: 0.5761 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 95 score: 0.7141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 96 score: 0.4746 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 97 score: 0.7682 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 98 score: 0.6170 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 99 score: 0.7143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 100 score: 0.5711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 101 score: 0.7490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 102 score: 0.7312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 103 score: 0.6600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 104 score: 0.8214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 105 score: 0.6223 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 106 score: 0.7469 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 107 score: 0.3166 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 108 score: 0.3044 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 109 score: 0.6406 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 110 score: 0.6222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 111 score: 0.6828 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 112 score: 0.8184 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 113 score: 0.7337 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 114 score: 0.3892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 115 score: 0.6566 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 116 score: 0.6240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 117 score: 0.7508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 118 score: 0.8047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 119 score: 0.5992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 120 score: 0.4672 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 121 score: 0.7878 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 122 score: 0.9144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 123 score: 0.8217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 124 score: 0.7380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 125 score: 0.5495 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 126 score: 0.7530 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 127 score: 0.5659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 128 score: 0.6639 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 129 score: 0.7214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 130 score: 0.7572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 131 score: 0.7801 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 132 score: 0.6860 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 133 score: 0.7523 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 134 score: 0.5362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 135 score: 0.3818 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 136 score: 0.8530 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 137 score: 0.2661 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 138 score: 0.6803 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 139 score: 0.3041 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 140 score: 0.4085 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 141 score: 0.6493 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 142 score: 0.5043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 143 score: 0.4972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 144 score: 0.7485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 145 score: 0.9020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 146 score: 0.7204 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 147 score: 0.8378 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 148 score: 0.6133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 149 score: 0.4771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 150 score: 0.6961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 151 score: 0.5982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 152 score: 0.5998 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 153 score: 0.6297 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 154 score: 0.4739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 155 score: 0.7400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 156 score: 0.5987 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 157 score: 0.6145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 158 score: 0.6792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 159 score: 0.6821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 160 score: 0.6309 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 161 score: 0.6073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 162 score: 0.3989 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 163 score: 0.4350 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 164 score: 0.6690 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 165 score: 0.6324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 166 score: 0.7422 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 167 score: 0.7897 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 168 score: 0.8375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 169 score: 0.5994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 170 score: 0.2363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 171 score: 0.7812 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 172 score: 0.4356 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 173 score: 0.6022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 174 score: 0.6249 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 175 score: 0.7112 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 176 score: 0.4429 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 177 score: 0.7135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 178 score: 0.4447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 179 score: 0.9058 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 180 score: 0.7464 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 181 score: 0.5920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 182 score: 0.7552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 183 score: 0.7716 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 184 score: 0.6379 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 185 score: 0.9114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 186 score: 0.6672 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 187 score: 0.6179 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 188 score: 0.3473 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 189 score: 0.6096 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 190 score: 0.4964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 191 score: 0.5370 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 192 score: 0.2800 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 193 score: 0.3682 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 194 score: 0.8051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 195 score: 0.8557 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 196 score: 0.5267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 197 score: 0.5906 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 198 score: 0.8432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 199 score: 0.1957 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 200 score: 0.7548 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 201 score: 0.4238 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 202 score: 0.4362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 203 score: 0.4824 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 204 score: 0.3011 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 205 score: 0.6225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 206 score: 0.6152 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 207 score: 0.4741 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 208 score: 0.7324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 209 score: 0.5559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 210 score: 0.7581 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 211 score: 0.8488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 212 score: 0.7270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 213 score: 0.9038 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 214 score: 0.8432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 215 score: 0.2104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 216 score: 0.7919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 217 score: 0.6350 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 218 score: 0.7726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 219 score: 0.8504 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 220 score: 0.7757 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 221 score: 0.6272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 222 score: 0.4273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 223 score: 0.5623 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 224 score: 0.8725 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 225 score: 0.4658 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 226 score: 0.3593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 227 score: 0.5325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 228 score: 0.6577 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 229 score: 0.6519 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 230 score: 0.8947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 231 score: 0.3194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 232 score: 0.6912 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 233 score: 0.2103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 234 score: 0.5631 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 235 score: 0.1753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 236 score: 0.6755 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 237 score: 0.7711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 238 score: 0.8673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 239 score: 0.6066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 240 score: 0.7507 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 241 score: 0.4892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 242 score: 0.8019 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 243 score: 0.5124 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 244 score: 0.4080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 245 score: 0.6934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 246 score: 0.7155 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 247 score: 0.4310 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 248 score: 0.2149 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 249 score: 0.9041 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 250 score: 0.8840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 251 score: 0.8741 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 252 score: 0.7428 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 253 score: 0.4222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 254 score: 0.5197 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 255 score: 0.8756 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 256 score: 0.5589 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 257 score: 0.5787 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 258 score: 0.5621 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 259 score: 0.5426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 260 score: 0.7839 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 261 score: 0.5078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 262 score: 0.6100 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 263 score: 0.3860 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 264 score: 0.7507 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 265 score: 0.1542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 266 score: 0.5995 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 267 score: 0.6491 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 268 score: 0.8059 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 269 score: 0.7539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 270 score: 0.4257 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 271 score: 0.1786 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 272 score: 0.7895 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 273 score: 0.5950 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 274 score: 0.7557 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 275 score: 0.6590 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 276 score: 0.5512 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 277 score: 0.5416 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 278 score: 0.6360 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 279 score: 0.5804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 280 score: 0.6843 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 281 score: 0.8399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 282 score: 0.7812 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 283 score: 0.6595 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 284 score: 0.7063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 285 score: 0.8677 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 286 score: 0.6692 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 287 score: 0.4547 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 288 score: 0.7152 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 289 score: 0.5397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 290 score: 0.6345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 291 score: 0.3883 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 292 score: 0.5185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 293 score: 0.7389 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 294 score: 0.6424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 295 score: 0.5024 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 296 score: 0.5521 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 297 score: 0.7961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 298 score: 0.9062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 299 score: 0.8551 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 300 score: 0.7961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 301 score: 0.3934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 302 score: 0.4899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 303 score: 0.8375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 304 score: 0.7779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 305 score: 0.8351 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 306 score: 0.8445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 307 score: 0.8304 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 308 score: 0.6404 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 309 score: 0.4597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 310 score: 0.5259 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 311 score: 0.3233 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 312 score: 0.5998 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 313 score: 0.5071 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 314 score: 0.6084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 315 score: 0.7723 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 316 score: 0.4554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 317 score: 0.4888 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 318 score: 0.2982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 319 score: 0.5028 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 320 score: 0.6357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 321 score: 0.7339 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 322 score: 0.7606 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 323 score: 0.7753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 324 score: 0.6740 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 325 score: 0.8759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 326 score: 0.5367 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 327 score: 0.7376 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 328 score: 0.2390 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 329 score: 0.7517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 330 score: 0.7402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 331 score: 0.5256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 332 score: 0.8255 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 333 score: 0.7839 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 334 score: 0.8691 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 335 score: 0.4598 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 336 score: 0.3091 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 337 score: 0.1506 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 338 score: 0.6732 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 339 score: 0.7991 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 340 score: 0.3467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 341 score: 0.5477 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 342 score: 0.3484 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 343 score: 0.4067 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 344 score: 0.7523 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 345 score: 0.7575 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 346 score: 0.7017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 347 score: 0.4601 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 348 score: 0.3565 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 349 score: 0.4583 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 350 score: 0.6405 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 351 score: 0.4548 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 352 score: 0.6719 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 353 score: 0.7126 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 354 score: 0.4574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 355 score: 0.5438 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 356 score: 0.5682 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 357 score: 0.7599 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 358 score: 0.9143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 359 score: 0.3981 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 360 score: 0.4831 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 361 score: 0.5936 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 362 score: 0.5080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 363 score: 0.3769 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 364 score: 0.7099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 365 score: 0.5975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 366 score: 0.3447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 367 score: 0.7197 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 368 score: 0.3315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 369 score: 0.6188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 370 score: 0.4162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 371 score: 0.2017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 372 score: 0.2066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 373 score: 0.7570 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 374 score: 0.7954 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 375 score: 0.5993 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 376 score: 0.5810 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 377 score: 0.2352 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 378 score: 0.2066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 379 score: 0.4168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 380 score: 0.7671 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 381 score: 0.3795 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 382 score: 0.4694 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 383 score: 0.6009 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 384 score: 0.6612 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 385 score: 0.4777 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 386 score: 0.3955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 387 score: 0.7275 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 388 score: 0.3022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 389 score: 0.7743 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 390 score: 0.4396 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 391 score: 0.6346 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 392 score: 0.5792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 393 score: 0.7343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 394 score: 0.8558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 395 score: 0.4816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 396 score: 0.7087 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 397 score: 0.4154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 398 score: 0.6032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 399 score: 0.7171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 400 score: 0.8203 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 401 score: 0.2219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 402 score: 0.7739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 403 score: 0.6132 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 404 score: 0.5032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 405 score: 0.2259 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 406 score: 0.6488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 407 score: 0.6493 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 408 score: 0.6762 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 409 score: 0.7710 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 410 score: 0.6445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 411 score: 0.6705 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 412 score: 0.6648 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 413 score: 0.1973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 414 score: 0.6293 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 415 score: 0.8035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 416 score: 0.7558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 417 score: 0.3209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 418 score: 0.8010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 419 score: 0.7613 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 420 score: 0.7970 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 421 score: 0.9265 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 422 score: 0.3999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 423 score: 0.7186 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 424 score: 0.5875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 425 score: 0.7349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 426 score: 0.4055 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 427 score: 0.5815 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 428 score: 0.7890 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 429 score: 0.6845 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 430 score: 0.6944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 431 score: 0.7526 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 432 score: 0.6731 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 433 score: 0.2217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 434 score: 0.5128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 435 score: 0.4672 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 436 score: 0.4805 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 437 score: 0.7189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 438 score: 0.6849 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 439 score: 0.6581 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 440 score: 0.5482 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 441 score: 0.8049 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 442 score: 0.7102 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 443 score: 0.5830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 444 score: 0.6554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 445 score: 0.6485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 446 score: 0.6028 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 447 score: 0.7830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 448 score: 0.8809 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 449 score: 0.5965 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 450 score: 0.4139 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 451 score: 0.6349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 452 score: 0.5408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 453 score: 0.6900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 454 score: 0.6510 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 455 score: 0.6666 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 456 score: 0.3166 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 457 score: 0.6705 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 458 score: 0.1700 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 459 score: 0.6104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 460 score: 0.5341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 461 score: 0.6447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 462 score: 0.6212 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 463 score: 0.6363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 464 score: 0.4029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 465 score: 0.6123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 466 score: 0.3863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 467 score: 0.5340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 468 score: 0.2637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 469 score: 0.3466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 470 score: 0.4662 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 471 score: 0.6016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 472 score: 0.4681 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 473 score: 0.1923 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 474 score: 0.4490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 475 score: 0.2797 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 476 score: 0.7000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 477 score: 0.6485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 478 score: 0.7031 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 479 score: 0.7655 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 480 score: 0.4480 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 481 score: 0.5250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 482 score: 0.3073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 483 score: 0.6290 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 484 score: 0.3063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 485 score: 0.7117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 486 score: 0.6741 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 487 score: 0.5776 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 488 score: 0.7113 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 489 score: 0.6795 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 490 score: 0.4790 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 491 score: 0.8003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 492 score: 0.9363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 493 score: 0.5552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 494 score: 0.7596 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 495 score: 0.5939 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 496 score: 0.5854 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 497 score: 0.2655 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 498 score: 0.2211 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 499 score: 0.7904 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 500 score: 0.7778 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 501 score: 0.3482 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 502 score: 0.7569 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 503 score: 0.6465 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 504 score: 0.4802 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 505 score: 0.5964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 506 score: 0.7551 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 507 score: 0.6320 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 508 score: 0.6035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 509 score: 0.8032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 510 score: 0.5380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 511 score: 0.7099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 512 score: 0.4274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 513 score: 0.6788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 514 score: 0.8358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 515 score: 0.6658 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 516 score: 0.4880 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 517 score: 0.7703 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 518 score: 0.7727 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 519 score: 0.7410 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 520 score: 0.7025 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 521 score: 0.7508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 522 score: 0.3396 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 523 score: 0.7094 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 524 score: 0.7697 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 525 score: 0.5668 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 526 score: 0.4225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 527 score: 0.4235 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 528 score: 0.3148 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 529 score: 0.6787 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 530 score: 0.3567 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 531 score: 0.3368 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 532 score: 0.4455 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 533 score: 0.5547 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 534 score: 0.4643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 535 score: 0.6547 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 536 score: 0.5730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 537 score: 0.4330 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 538 score: 0.2998 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 539 score: 0.4777 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 540 score: 0.6400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 541 score: 0.4168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 542 score: 0.6996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 543 score: 0.4278 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 544 score: 0.5607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 545 score: 0.6824 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 546 score: 0.8328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 547 score: 0.6972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 548 score: 0.5509 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 549 score: 0.8215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 550 score: 0.3716 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 551 score: 0.8298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 552 score: 0.6869 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 553 score: 0.6820 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 554 score: 0.6142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 555 score: 0.3981 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 556 score: 0.3911 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 557 score: 0.8466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 558 score: 0.2903 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 559 score: 0.2893 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 560 score: 0.2561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 561 score: 0.2809 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 562 score: 0.3401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 563 score: 0.4919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 564 score: 0.6563 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 565 score: 0.7405 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 566 score: 0.7600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 567 score: 0.6625 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 568 score: 0.5746 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 569 score: 0.5474 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 570 score: 0.6345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 571 score: 0.7407 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 572 score: 0.3746 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 573 score: 0.7120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 574 score: 0.6391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 575 score: 0.5242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 576 score: 0.4798 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 577 score: 0.7207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 578 score: 0.8454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 579 score: 0.4207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 580 score: 0.4912 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 581 score: 0.6831 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 582 score: 0.3457 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 583 score: 0.6397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 584 score: 0.5708 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 585 score: 0.5659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 586 score: 0.5605 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 587 score: 0.6767 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 588 score: 0.6158 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 589 score: 0.4980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 590 score: 0.7611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 591 score: 0.8234 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 592 score: 0.4131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 593 score: 0.3218 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 594 score: 0.5897 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 595 score: 0.5813 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 596 score: 0.5310 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 597 score: 0.3525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 598 score: 0.3492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 599 score: 0.6228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 600 score: 0.6744 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 601 score: 0.3555 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 602 score: 0.3849 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 603 score: 0.2660 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 604 score: 0.8711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 605 score: 0.3129 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 606 score: 0.7267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 607 score: 0.6292 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 608 score: 0.3345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 609 score: 0.6739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 610 score: 0.4510 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 611 score: 0.8384 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 612 score: 0.5228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 613 score: 0.5838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 614 score: 0.4268 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 615 score: 0.4039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 616 score: 0.7496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 617 score: 0.7201 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 618 score: 0.6230 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 619 score: 0.2501 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 620 score: 0.6391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 621 score: 0.4195 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 622 score: 0.3283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 623 score: 0.2049 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 624 score: 0.6832 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 625 score: 0.8274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 626 score: 0.8004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 627 score: 0.8778 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 628 score: 0.8771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 629 score: 0.7215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 630 score: 0.6220 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 631 score: 0.8488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 632 score: 0.8287 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 633 score: 0.7353 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 634 score: 0.8752 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 635 score: 0.6977 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 636 score: 0.5653 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 637 score: 0.7211 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 638 score: 0.2106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 639 score: 0.2109 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 640 score: 0.2205 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 641 score: 0.7807 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 642 score: 0.5452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 643 score: 0.5851 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 644 score: 0.4949 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 645 score: 0.5427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 646 score: 0.6732 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 647 score: 0.4921 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 648 score: 0.1816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 649 score: 0.2375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 650 score: 0.4828 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 651 score: 0.4081 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 652 score: 0.4093 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 653 score: 0.4043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 654 score: 0.5060 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 655 score: 0.7034 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 656 score: 0.8464 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 657 score: 0.3807 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 658 score: 0.3697 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 659 score: 0.4115 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 660 score: 0.7924 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 661 score: 0.8177 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 662 score: 0.7823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 663 score: 0.6608 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 664 score: 0.3701 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 665 score: 0.7983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 666 score: 0.6816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 667 score: 0.7256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 668 score: 0.7101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 669 score: 0.7438 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 670 score: 0.7057 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 671 score: 0.7908 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 672 score: 0.8974 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 673 score: 0.5745 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 674 score: 0.2260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 675 score: 0.2934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 676 score: 0.8216 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 677 score: 0.7014 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 678 score: 0.6879 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 679 score: 0.3360 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 680 score: 0.4597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 681 score: 0.3600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 682 score: 0.7739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 683 score: 0.4503 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 684 score: 0.8176 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 685 score: 0.7466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 686 score: 0.8064 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 687 score: 0.6155 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 688 score: 0.7066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 689 score: 0.6684 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 690 score: 0.8415 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 691 score: 0.6016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 692 score: 0.8482 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 693 score: 0.7118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 694 score: 0.2483 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 695 score: 0.6483 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 696 score: 0.6508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 697 score: 0.8079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 698 score: 0.7326 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 699 score: 0.6757 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 700 score: 0.4031 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 701 score: 0.7210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 702 score: 0.7401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 703 score: 0.6771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 704 score: 0.2464 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 705 score: 0.4473 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 706 score: 0.6465 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 707 score: 0.2288 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 708 score: 0.4394 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 709 score: 0.7454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 710 score: 0.5601 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 711 score: 0.2363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 712 score: 0.8589 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 713 score: 0.6821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 714 score: 0.5585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 715 score: 0.3970 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 716 score: 0.8374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 717 score: 0.5734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 718 score: 0.8302 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 719 score: 0.6284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 720 score: 0.6215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 721 score: 0.4466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 722 score: 0.7034 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 723 score: 0.8020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 724 score: 0.7842 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 725 score: 0.8006 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 726 score: 0.3489 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 727 score: 0.6600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 728 score: 0.6035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 729 score: 0.6079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 730 score: 0.5027 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 731 score: 0.6072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 732 score: 0.5222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 733 score: 0.7340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 734 score: 0.2982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 735 score: 0.2226 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 736 score: 0.6709 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 737 score: 0.8079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 738 score: 0.3056 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 739 score: 0.7871 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 740 score: 0.8320 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 741 score: 0.2110 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 742 score: 0.5099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 743 score: 0.5636 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 744 score: 0.6004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 745 score: 0.4520 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 746 score: 0.7044 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 747 score: 0.4711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 748 score: 0.5504 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 749 score: 0.6084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 750 score: 0.7450 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 751 score: 0.8609 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 752 score: 0.7680 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 753 score: 0.6434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 754 score: 0.6421 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 755 score: 0.5925 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 756 score: 0.6397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 757 score: 0.7671 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 758 score: 0.3188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 759 score: 0.5066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 760 score: 0.7904 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 761 score: 0.5883 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 762 score: 0.5491 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 763 score: 0.6389 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 764 score: 0.5625 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 765 score: 0.2602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 766 score: 0.7321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 767 score: 0.3525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 768 score: 0.8844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 769 score: 0.8284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 770 score: 0.2276 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 771 score: 0.6904 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 772 score: 0.6845 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 773 score: 0.7327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 774 score: 0.7388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 775 score: 0.4413 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 776 score: 0.5565 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 777 score: 0.6946 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 778 score: 0.2128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 779 score: 0.3278 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 780 score: 0.4952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 781 score: 0.4750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 782 score: 0.8174 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 783 score: 0.8263 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 784 score: 0.5391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 785 score: 0.4559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 786 score: 0.6056 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 787 score: 0.5196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 788 score: 0.8632 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 789 score: 0.7311 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 790 score: 0.5327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 791 score: 0.8257 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 792 score: 0.7144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 793 score: 0.6684 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 794 score: 0.6719 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 795 score: 0.2388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 796 score: 0.2755 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 797 score: 0.4972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 798 score: 0.7492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 799 score: 0.2393 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 800 score: 0.7759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 801 score: 0.6866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 802 score: 0.4517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 803 score: 0.6133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 804 score: 0.3237 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 805 score: 0.3180 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 806 score: 0.5990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 807 score: 0.6953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 808 score: 0.6157 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 809 score: 0.3321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 810 score: 0.2758 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 811 score: 0.3539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 812 score: 0.7241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 813 score: 0.7299 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 814 score: 0.8986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 815 score: 0.7473 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 816 score: 0.7957 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 817 score: 0.1953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 818 score: 0.2090 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 819 score: 0.3555 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 820 score: 0.6171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 821 score: 0.5369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 822 score: 0.5466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 823 score: 0.8886 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 824 score: 0.3779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 825 score: 0.3534 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 826 score: 0.6791 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 827 score: 0.5652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 828 score: 0.6377 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 829 score: 0.4208 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 830 score: 0.2863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 831 score: 0.7142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 832 score: 0.6004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 833 score: 0.5009 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 834 score: 0.2829 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 835 score: 0.7946 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 836 score: 0.3122 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 837 score: 0.5794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 838 score: 0.4596 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 839 score: 0.7196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 840 score: 0.7837 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 841 score: 0.3608 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 842 score: 0.4630 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 843 score: 0.4229 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 844 score: 0.2037 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 845 score: 0.1891 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 846 score: 0.2086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 847 score: 0.5787 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 848 score: 0.3348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 849 score: 0.2969 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 850 score: 0.4335 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 851 score: 0.5712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 852 score: 0.8106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 853 score: 0.5949 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 854 score: 0.3947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 855 score: 0.5663 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 856 score: 0.4958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 857 score: 0.9014 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 858 score: 0.5846 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 859 score: 0.7272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 860 score: 0.7430 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 861 score: 0.6305 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 862 score: 0.8220 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 863 score: 0.2128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 864 score: 0.5556 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 865 score: 0.4934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 866 score: 0.7244 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 867 score: 0.8531 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 868 score: 0.6987 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 869 score: 0.7832 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 870 score: 0.7163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 871 score: 0.7999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 872 score: 0.6331 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 873 score: 0.3518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 874 score: 0.5354 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 875 score: 0.4414 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 876 score: 0.2892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 877 score: 0.8008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 878 score: 0.7379 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 879 score: 0.7978 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 880 score: 0.6713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 881 score: 0.7273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 882 score: 0.3324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 883 score: 0.7390 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 884 score: 0.7348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 885 score: 0.6855 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 886 score: 0.6221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 887 score: 0.5094 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 888 score: 0.3641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 889 score: 0.2647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 890 score: 0.5932 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 891 score: 0.5861 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 892 score: 0.6080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 893 score: 0.4537 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 894 score: 0.7683 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 895 score: 0.8723 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 896 score: 0.7256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 897 score: 0.7140 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 898 score: 0.6175 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 899 score: 0.5589 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 900 score: 0.2350 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 901 score: 0.5596 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 902 score: 0.3610 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 903 score: 0.4710 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 904 score: 0.8233 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 905 score: 0.2914 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 906 score: 0.6518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 907 score: 0.2409 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 908 score: 0.6382 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 909 score: 0.2012 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 910 score: 0.7257 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 911 score: 0.7698 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 912 score: 0.9543 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 913 score: 0.6993 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 914 score: 0.6761 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 915 score: 0.8135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 916 score: 0.9018 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 917 score: 0.6322 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 918 score: 0.7475 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 919 score: 0.6689 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 920 score: 0.1878 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 921 score: 0.7491 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 922 score: 0.6317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 923 score: 0.8523 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 924 score: 0.2631 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 925 score: 0.1798 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 926 score: 0.8078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 927 score: 0.7416 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 928 score: 0.7780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 929 score: 0.6434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 930 score: 0.7171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 931 score: 0.7771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 932 score: 0.6791 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 933 score: 0.6773 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 934 score: 0.6554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 935 score: 0.6232 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 936 score: 0.8488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 937 score: 0.8836 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 938 score: 0.6552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 939 score: 0.7194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 940 score: 0.7359 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 941 score: 0.8380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 942 score: 0.8530 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 943 score: 0.1445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 944 score: 0.3272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 945 score: 0.5388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 946 score: 0.4246 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 947 score: 0.5499 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 948 score: 0.7003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 949 score: 0.8616 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 950 score: 0.7778 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 951 score: 0.2733 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 952 score: 0.3625 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 953 score: 0.1860 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 954 score: 0.4426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 955 score: 0.6977 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 956 score: 0.7802 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 957 score: 0.7533 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 958 score: 0.2779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 959 score: 0.5375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 960 score: 0.4801 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 961 score: 0.2984 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 962 score: 0.3503 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 963 score: 0.6458 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 964 score: 0.8120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 965 score: 0.2452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 966 score: 0.5138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 967 score: 0.2432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 968 score: 0.1721 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 969 score: 0.5566 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 970 score: 0.6999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 971 score: 0.4899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 972 score: 0.3531 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 973 score: 0.3091 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 974 score: 0.6114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 975 score: 0.8796 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 976 score: 0.7433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 977 score: 0.7782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 978 score: 0.4023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 979 score: 0.7781 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 980 score: 0.3270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 981 score: 0.7631 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 982 score: 0.5120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 983 score: 0.3032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 984 score: 0.6692 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 985 score: 0.6974 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 986 score: 0.5196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 987 score: 0.2467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 988 score: 0.4720 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 989 score: 0.2875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 990 score: 0.8051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 991 score: 0.5250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 992 score: 0.4029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 993 score: 0.6971 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 994 score: 0.8423 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 995 score: 0.6462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 996 score: 0.8496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 997 score: 0.9192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 998 score: 0.4208 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 999 score: 0.6194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1000 score: 0.7611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1001 score: 0.4904 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1002 score: 0.5294 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1003 score: 0.3290 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1004 score: 0.2469 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1005 score: 0.6434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1006 score: 0.7824 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1007 score: 0.8193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1008 score: 0.5380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1009 score: 0.6487 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1010 score: 0.7491 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th Segment 1011 score: 0.7541 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-th-max-tokens-512//test-en-th score: 0.5928