diff --git "a/test-en-hu.comet" "b/test-en-hu.comet" new file mode 100644--- /dev/null +++ "b/test-en-hu.comet" @@ -0,0 +1,1013 @@ +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 0 score: 0.8486 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1 score: 0.9080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 2 score: 0.9127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 3 score: 0.8192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 4 score: 0.7895 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 5 score: 0.6673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 6 score: 0.6522 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 7 score: 0.8823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 8 score: 0.8812 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 9 score: 0.6983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 10 score: 0.9079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 11 score: 0.8447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 12 score: 0.8248 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 13 score: 0.8864 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 14 score: 0.8195 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 15 score: 0.8444 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 16 score: 0.8186 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 17 score: 0.9478 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 18 score: 0.9228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 19 score: 0.9022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 20 score: 0.9555 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 21 score: 0.9444 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 22 score: 0.8964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 23 score: 0.8891 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 24 score: 0.9026 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 25 score: 0.9401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 26 score: 0.9103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 27 score: 0.7876 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 28 score: 0.8262 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 29 score: 0.8648 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 30 score: 0.8024 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 31 score: 0.8490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 32 score: 0.8829 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 33 score: 0.9154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 34 score: 0.9292 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 35 score: 0.9268 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 36 score: 0.8840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 37 score: 0.9143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 38 score: 0.8401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 39 score: 0.8950 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 40 score: 0.8719 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 41 score: 0.9289 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 42 score: 0.9230 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 43 score: 0.9072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 44 score: 0.8242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 45 score: 0.8722 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 46 score: 0.9116 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 47 score: 0.8855 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 48 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 49 score: 0.8283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 50 score: 0.7947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 51 score: 0.9035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 52 score: 0.9379 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 53 score: 0.9277 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 54 score: 0.7813 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 55 score: 0.8888 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 56 score: 0.8225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 57 score: 0.8621 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 58 score: 0.8565 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 59 score: 0.9592 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 60 score: 0.9101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 61 score: 0.9463 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 62 score: 0.8342 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 63 score: 0.8743 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 64 score: 0.9144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 65 score: 0.8311 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 66 score: 0.7084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 67 score: 0.7379 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 68 score: 0.9417 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 69 score: 0.8620 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 70 score: 0.7356 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 71 score: 0.7888 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 72 score: 0.9000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 73 score: 0.8803 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 74 score: 0.8442 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 75 score: 0.8742 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 76 score: 0.8838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 77 score: 0.8226 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 78 score: 0.9459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 79 score: 0.8863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 80 score: 0.8932 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 81 score: 0.9368 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 82 score: 0.8540 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 83 score: 0.8221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 84 score: 0.8361 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 85 score: 0.9142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 86 score: 0.8420 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 87 score: 0.8253 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 88 score: 0.9246 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 89 score: 0.8344 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 90 score: 0.7535 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 91 score: 0.8841 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 92 score: 0.8679 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 93 score: 0.8214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 94 score: 0.8400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 95 score: 0.9198 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 96 score: 0.8943 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 97 score: 0.9125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 98 score: 0.9295 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 99 score: 0.8780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 100 score: 0.7985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 101 score: 0.8135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 102 score: 0.9115 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 103 score: 0.9630 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 104 score: 0.8180 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 105 score: 0.7906 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 106 score: 0.8943 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 107 score: 0.8788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 108 score: 0.3371 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 109 score: 0.8306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 110 score: 0.8903 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 111 score: 0.8999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 112 score: 0.9328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 113 score: 0.8975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 114 score: 0.8118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 115 score: 0.8831 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 116 score: 0.8806 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 117 score: 0.9349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 118 score: 0.9556 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 119 score: 0.8322 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 120 score: 0.8807 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 121 score: 0.9240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 122 score: 0.9646 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 123 score: 0.9666 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 124 score: 0.8960 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 125 score: 0.9127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 126 score: 0.9022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 127 score: 0.8942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 128 score: 0.9065 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 129 score: 0.9222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 130 score: 0.8931 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 131 score: 0.8638 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 132 score: 0.8889 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 133 score: 0.9521 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 134 score: 0.7957 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 135 score: 0.6600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 136 score: 0.9161 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 137 score: 0.7569 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 138 score: 0.9467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 139 score: 0.8237 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 140 score: 0.9185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 141 score: 0.7823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 142 score: 0.8748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 143 score: 0.8983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 144 score: 0.8994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 145 score: 0.9301 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 146 score: 0.9223 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 147 score: 0.8859 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 148 score: 0.8678 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 149 score: 0.8940 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 150 score: 0.8731 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 151 score: 0.8904 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 152 score: 0.7785 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 153 score: 0.8223 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 154 score: 0.7969 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 155 score: 0.7947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 156 score: 0.8551 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 157 score: 0.7466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 158 score: 0.9402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 159 score: 0.9252 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 160 score: 0.9172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 161 score: 0.8492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 162 score: 0.8217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 163 score: 0.8267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 164 score: 0.9435 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 165 score: 0.8001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 166 score: 0.7967 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 167 score: 0.8916 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 168 score: 0.8697 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 169 score: 0.8270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 170 score: 0.8529 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 171 score: 0.9089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 172 score: 0.9079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 173 score: 0.8577 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 174 score: 0.8415 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 175 score: 0.9236 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 176 score: 0.8524 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 177 score: 0.9242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 178 score: 0.8394 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 179 score: 0.9293 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 180 score: 0.9153 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 181 score: 0.9172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 182 score: 0.9298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 183 score: 0.9614 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 184 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 185 score: 0.9135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 186 score: 0.9400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 187 score: 0.8972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 188 score: 0.8466 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 189 score: 0.8337 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 190 score: 0.8469 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 191 score: 0.9022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 192 score: 0.8887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 193 score: 0.8623 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 194 score: 0.9039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 195 score: 0.9488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 196 score: 0.8261 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 197 score: 0.8427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 198 score: 0.8479 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 199 score: 0.8698 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 200 score: 0.8209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 201 score: 0.8448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 202 score: 0.8261 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 203 score: 0.7571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 204 score: 0.9059 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 205 score: 0.9028 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 206 score: 0.9293 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 207 score: 0.8816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 208 score: 0.8416 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 209 score: 0.9388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 210 score: 0.8737 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 211 score: 0.9014 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 212 score: 0.9021 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 213 score: 0.9447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 214 score: 0.9345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 215 score: 0.8602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 216 score: 0.7063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 217 score: 0.8880 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 218 score: 0.8850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 219 score: 0.8757 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 220 score: 0.9664 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 221 score: 0.9329 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 222 score: 0.9188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 223 score: 0.8904 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 224 score: 0.9260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 225 score: 0.9455 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 226 score: 0.8931 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 227 score: 0.7954 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 228 score: 0.8555 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 229 score: 0.7691 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 230 score: 0.9607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 231 score: 0.9361 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 232 score: 0.9043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 233 score: 0.9540 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 234 score: 0.8262 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 235 score: 0.8601 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 236 score: 0.8378 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 237 score: 0.8532 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 238 score: 0.8935 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 239 score: 0.8455 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 240 score: 0.8462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 241 score: 0.8269 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 242 score: 0.8167 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 243 score: 0.7771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 244 score: 0.8263 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 245 score: 0.8955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 246 score: 0.7726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 247 score: 0.8290 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 248 score: 0.6121 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 249 score: 0.8640 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 250 score: 0.9062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 251 score: 0.9294 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 252 score: 0.9462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 253 score: 0.9465 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 254 score: 0.9448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 255 score: 0.9319 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 256 score: 0.8607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 257 score: 0.9397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 258 score: 0.8775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 259 score: 0.8672 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 260 score: 0.8560 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 261 score: 0.6985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 262 score: 0.9283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 263 score: 0.7736 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 264 score: 0.9319 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 265 score: 0.8900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 266 score: 0.8655 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 267 score: 0.8923 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 268 score: 0.9415 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 269 score: 0.7791 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 270 score: 0.8120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 271 score: 0.8433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 272 score: 0.9043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 273 score: 0.8958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 274 score: 0.7450 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 275 score: 0.8105 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 276 score: 0.7431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 277 score: 0.8944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 278 score: 0.9182 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 279 score: 0.9496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 280 score: 0.9239 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 281 score: 0.9596 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 282 score: 0.9707 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 283 score: 0.8768 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 284 score: 0.9249 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 285 score: 0.9396 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 286 score: 0.8707 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 287 score: 0.8799 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 288 score: 0.9106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 289 score: 0.9373 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 290 score: 0.8775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 291 score: 0.8088 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 292 score: 0.9465 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 293 score: 0.9168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 294 score: 0.8659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 295 score: 0.8298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 296 score: 0.8358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 297 score: 0.9014 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 298 score: 0.9443 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 299 score: 0.9123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 300 score: 0.8839 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 301 score: 0.9222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 302 score: 0.9066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 303 score: 0.8958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 304 score: 0.8778 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 305 score: 0.9001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 306 score: 0.8766 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 307 score: 0.8644 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 308 score: 0.9289 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 309 score: 0.8638 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 310 score: 0.9641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 311 score: 0.8573 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 312 score: 0.7573 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 313 score: 0.7495 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 314 score: 0.9600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 315 score: 0.9300 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 316 score: 0.8980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 317 score: 0.8664 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 318 score: 0.9291 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 319 score: 0.6815 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 320 score: 0.8056 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 321 score: 0.8443 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 322 score: 0.8900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 323 score: 0.8978 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 324 score: 0.9490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 325 score: 0.8652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 326 score: 0.8838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 327 score: 0.8299 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 328 score: 0.8881 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 329 score: 0.8932 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 330 score: 0.8835 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 331 score: 0.8801 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 332 score: 0.9284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 333 score: 0.9193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 334 score: 0.9005 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 335 score: 0.9244 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 336 score: 0.8718 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 337 score: 0.8840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 338 score: 0.9038 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 339 score: 0.9433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 340 score: 0.8327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 341 score: 0.6678 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 342 score: 0.5782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 343 score: 0.5663 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 344 score: 0.8561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 345 score: 0.8330 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 346 score: 0.9206 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 347 score: 0.9187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 348 score: 0.8858 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 349 score: 0.8546 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 350 score: 0.7791 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 351 score: 0.7348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 352 score: 0.9235 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 353 score: 0.8150 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 354 score: 0.8543 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 355 score: 0.8769 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 356 score: 0.9168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 357 score: 0.8773 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 358 score: 0.8376 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 359 score: 0.7431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 360 score: 0.8114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 361 score: 0.8715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 362 score: 0.8608 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 363 score: 0.8996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 364 score: 0.8460 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 365 score: 0.8419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 366 score: 0.5748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 367 score: 0.7781 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 368 score: 0.2177 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 369 score: 0.8276 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 370 score: 0.8342 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 371 score: 0.8089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 372 score: 0.8634 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 373 score: 0.8670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 374 score: 0.9057 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 375 score: 0.9580 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 376 score: 0.9246 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 377 score: 0.9459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 378 score: 0.8531 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 379 score: 0.8802 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 380 score: 0.9443 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 381 score: 0.7495 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 382 score: 0.6128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 383 score: 0.8120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 384 score: 0.8821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 385 score: 0.7468 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 386 score: 0.3951 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 387 score: 0.8838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 388 score: 0.6065 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 389 score: 0.9538 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 390 score: 0.9476 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 391 score: 0.9357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 392 score: 0.9243 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 393 score: 0.9471 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 394 score: 0.8998 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 395 score: 0.9502 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 396 score: 0.9047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 397 score: 0.9371 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 398 score: 0.8410 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 399 score: 0.9485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 400 score: 0.9242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 401 score: 0.8499 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 402 score: 0.9392 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 403 score: 0.8120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 404 score: 0.7595 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 405 score: 0.8684 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 406 score: 0.9522 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 407 score: 0.9118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 408 score: 0.9256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 409 score: 0.9371 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 410 score: 0.8967 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 411 score: 0.7898 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 412 score: 0.8624 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 413 score: 0.9332 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 414 score: 0.8656 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 415 score: 0.8989 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 416 score: 0.8927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 417 score: 0.7785 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 418 score: 0.9528 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 419 score: 0.9427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 420 score: 0.9222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 421 score: 0.9558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 422 score: 0.8581 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 423 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 424 score: 0.9204 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 425 score: 0.8926 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 426 score: 0.9232 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 427 score: 0.9408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 428 score: 0.9106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 429 score: 0.9269 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 430 score: 0.9167 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 431 score: 0.7574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 432 score: 0.8508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 433 score: 0.6332 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 434 score: 0.8617 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 435 score: 0.8129 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 436 score: 0.8204 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 437 score: 0.7873 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 438 score: 0.9251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 439 score: 0.8540 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 440 score: 0.9168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 441 score: 0.9110 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 442 score: 0.9256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 443 score: 0.8944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 444 score: 0.8640 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 445 score: 0.8933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 446 score: 0.8854 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 447 score: 0.8952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 448 score: 0.9035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 449 score: 0.7812 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 450 score: 0.9066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 451 score: 0.9160 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 452 score: 0.9457 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 453 score: 0.9280 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 454 score: 0.8771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 455 score: 0.9016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 456 score: 0.7434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 457 score: 0.9298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 458 score: 0.8621 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 459 score: 0.8385 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 460 score: 0.9111 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 461 score: 0.8086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 462 score: 0.8023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 463 score: 0.9054 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 464 score: 0.9238 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 465 score: 0.8780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 466 score: 0.9270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 467 score: 0.8082 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 468 score: 0.5141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 469 score: 0.5789 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 470 score: 0.8142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 471 score: 0.7016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 472 score: 0.8386 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 473 score: 0.8000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 474 score: 0.8147 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 475 score: 0.9194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 476 score: 0.8306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 477 score: 0.8945 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 478 score: 0.9414 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 479 score: 0.9289 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 480 score: 0.9138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 481 score: 0.7924 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 482 score: 0.8587 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 483 score: 0.8986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 484 score: 0.8252 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 485 score: 0.8640 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 486 score: 0.8830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 487 score: 0.8531 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 488 score: 0.8979 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 489 score: 0.8214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 490 score: 0.7925 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 491 score: 0.8723 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 492 score: 0.9609 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 493 score: 0.9076 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 494 score: 0.9236 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 495 score: 0.9090 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 496 score: 0.8484 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 497 score: 0.8125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 498 score: 0.8884 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 499 score: 0.8315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 500 score: 0.9146 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 501 score: 0.9095 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 502 score: 0.9008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 503 score: 0.8438 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 504 score: 0.8312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 505 score: 0.8455 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 506 score: 0.7260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 507 score: 0.8125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 508 score: 0.9035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 509 score: 0.8512 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 510 score: 0.7978 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 511 score: 0.7496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 512 score: 0.7942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 513 score: 0.7397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 514 score: 0.8429 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 515 score: 0.9285 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 516 score: 0.8538 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 517 score: 0.8500 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 518 score: 0.9193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 519 score: 0.9420 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 520 score: 0.9049 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 521 score: 0.8160 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 522 score: 0.8169 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 523 score: 0.8362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 524 score: 0.8977 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 525 score: 0.9182 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 526 score: 0.8991 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 527 score: 0.7324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 528 score: 0.8964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 529 score: 0.8492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 530 score: 0.8714 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 531 score: 0.9210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 532 score: 0.8853 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 533 score: 0.8441 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 534 score: 0.8452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 535 score: 0.6722 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 536 score: 0.7587 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 537 score: 0.8432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 538 score: 0.8680 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 539 score: 0.9317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 540 score: 0.9054 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 541 score: 0.9010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 542 score: 0.8994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 543 score: 0.8841 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 544 score: 0.9176 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 545 score: 0.9674 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 546 score: 0.8080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 547 score: 0.8998 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 548 score: 0.7008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 549 score: 0.9159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 550 score: 0.8860 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 551 score: 0.9144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 552 score: 0.9496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 553 score: 0.9109 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 554 score: 0.9236 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 555 score: 0.8196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 556 score: 0.8197 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 557 score: 0.8517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 558 score: 0.8017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 559 score: 0.8014 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 560 score: 0.8426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 561 score: 0.9355 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 562 score: 0.7471 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 563 score: 0.6391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 564 score: 0.8753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 565 score: 0.9521 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 566 score: 0.8638 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 567 score: 0.8727 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 568 score: 0.8462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 569 score: 0.6849 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 570 score: 0.8984 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 571 score: 0.9251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 572 score: 0.7852 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 573 score: 0.9138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 574 score: 0.9064 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 575 score: 0.9156 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 576 score: 0.8840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 577 score: 0.9000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 578 score: 0.8986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 579 score: 0.9264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 580 score: 0.8209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 581 score: 0.8395 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 582 score: 0.8369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 583 score: 0.9037 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 584 score: 0.6575 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 585 score: 0.9069 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 586 score: 0.8965 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 587 score: 0.8920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 588 score: 0.8058 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 589 score: 0.9084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 590 score: 0.9214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 591 score: 0.9384 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 592 score: 0.7951 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 593 score: 0.9216 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 594 score: 0.9118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 595 score: 0.9242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 596 score: 0.8506 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 597 score: 0.9021 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 598 score: 0.8832 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 599 score: 0.9233 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 600 score: 0.9154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 601 score: 0.8955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 602 score: 0.9312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 603 score: 0.9069 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 604 score: 0.9024 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 605 score: 0.9349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 606 score: 0.8587 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 607 score: 0.7880 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 608 score: 0.6905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 609 score: 0.8878 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 610 score: 0.9252 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 611 score: 0.9352 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 612 score: 0.9214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 613 score: 0.8434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 614 score: 0.8509 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 615 score: 0.8179 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 616 score: 0.9465 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 617 score: 0.9637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 618 score: 0.9275 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 619 score: 0.8525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 620 score: 0.7207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 621 score: 0.7644 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 622 score: 0.9164 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 623 score: 0.8107 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 624 score: 0.8001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 625 score: 0.9063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 626 score: 0.9341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 627 score: 0.8712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 628 score: 0.9350 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 629 score: 0.9219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 630 score: 0.9217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 631 score: 0.8962 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 632 score: 0.9546 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 633 score: 0.9250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 634 score: 0.9635 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 635 score: 0.9447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 636 score: 0.9231 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 637 score: 0.8816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 638 score: 0.8959 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 639 score: 0.9213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 640 score: 0.8905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 641 score: 0.9137 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 642 score: 0.8986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 643 score: 0.7078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 644 score: 0.8718 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 645 score: 0.7877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 646 score: 0.8601 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 647 score: 0.8822 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 648 score: 0.8095 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 649 score: 0.8903 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 650 score: 0.9059 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 651 score: 0.9030 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 652 score: 0.5675 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 653 score: 0.7736 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 654 score: 0.7975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 655 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 656 score: 0.7913 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 657 score: 0.8029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 658 score: 0.7224 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 659 score: 0.8659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 660 score: 0.7028 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 661 score: 0.9282 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 662 score: 0.8889 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 663 score: 0.8689 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 664 score: 0.9078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 665 score: 0.8924 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 666 score: 0.9020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 667 score: 0.7771 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 668 score: 0.8542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 669 score: 0.8764 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 670 score: 0.8939 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 671 score: 0.8991 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 672 score: 0.9103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 673 score: 0.9199 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 674 score: 0.9389 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 675 score: 0.8983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 676 score: 0.9163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 677 score: 0.9319 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 678 score: 0.6236 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 679 score: 0.9301 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 680 score: 0.8401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 681 score: 0.9642 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 682 score: 0.9201 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 683 score: 0.8328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 684 score: 0.8800 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 685 score: 0.8507 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 686 score: 0.8962 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 687 score: 0.9036 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 688 score: 0.8946 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 689 score: 0.8928 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 690 score: 0.9340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 691 score: 0.9121 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 692 score: 0.9374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 693 score: 0.9062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 694 score: 0.7794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 695 score: 0.8787 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 696 score: 0.8417 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 697 score: 0.9243 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 698 score: 0.7783 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 699 score: 0.9411 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 700 score: 0.9219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 701 score: 0.9542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 702 score: 0.9487 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 703 score: 0.7521 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 704 score: 0.9080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 705 score: 0.8534 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 706 score: 0.8090 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 707 score: 0.9392 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 708 score: 0.9337 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 709 score: 0.9461 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 710 score: 0.9314 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 711 score: 0.8374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 712 score: 0.9517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 713 score: 0.8368 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 714 score: 0.8780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 715 score: 0.8451 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 716 score: 0.8418 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 717 score: 0.8072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 718 score: 0.9554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 719 score: 0.9494 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 720 score: 0.8574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 721 score: 0.9267 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 722 score: 0.9078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 723 score: 0.9131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 724 score: 0.8593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 725 score: 0.9122 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 726 score: 0.8456 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 727 score: 0.8882 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 728 score: 0.8586 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 729 score: 0.7726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 730 score: 0.8323 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 731 score: 0.7753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 732 score: 0.8430 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 733 score: 0.9108 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 734 score: 0.8175 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 735 score: 0.9022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 736 score: 0.8749 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 737 score: 0.9025 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 738 score: 0.9215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 739 score: 0.8838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 740 score: 0.9151 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 741 score: 0.8348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 742 score: 0.8255 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 743 score: 0.9422 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 744 score: 0.9266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 745 score: 0.8813 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 746 score: 0.9120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 747 score: 0.8840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 748 score: 0.9621 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 749 score: 0.8821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 750 score: 0.8841 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 751 score: 0.8367 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 752 score: 0.8723 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 753 score: 0.8996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 754 score: 0.9209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 755 score: 0.9306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 756 score: 0.8727 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 757 score: 0.8835 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 758 score: 0.8885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 759 score: 0.8748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 760 score: 0.9547 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 761 score: 0.8531 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 762 score: 0.9350 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 763 score: 0.8586 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 764 score: 0.9112 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 765 score: 0.6062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 766 score: 0.8960 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 767 score: 0.8841 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 768 score: 0.9369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 769 score: 0.9241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 770 score: 0.9073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 771 score: 0.8454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 772 score: 0.8709 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 773 score: 0.9301 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 774 score: 0.8886 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 775 score: 0.8819 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 776 score: 0.8820 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 777 score: 0.8578 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 778 score: 0.9059 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 779 score: 0.8498 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 780 score: 0.8306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 781 score: 0.7971 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 782 score: 0.8664 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 783 score: 0.7867 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 784 score: 0.9070 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 785 score: 0.6953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 786 score: 0.9200 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 787 score: 0.9264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 788 score: 0.8685 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 789 score: 0.9011 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 790 score: 0.8651 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 791 score: 0.8454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 792 score: 0.8915 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 793 score: 0.9077 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 794 score: 0.8893 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 795 score: 0.8496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 796 score: 0.9308 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 797 score: 0.8818 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 798 score: 0.2173 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 799 score: 0.7900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 800 score: 0.8837 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 801 score: 0.8185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 802 score: 0.8764 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 803 score: 0.8910 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 804 score: 0.8036 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 805 score: 0.8656 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 806 score: 0.9269 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 807 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 808 score: 0.8500 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 809 score: 0.8490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 810 score: 0.7801 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 811 score: 0.7717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 812 score: 0.9264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 813 score: 0.9527 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 814 score: 0.8138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 815 score: 0.8535 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 816 score: 0.9056 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 817 score: 0.7781 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 818 score: 0.6448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 819 score: 0.8271 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 820 score: 0.9271 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 821 score: 0.8260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 822 score: 0.8924 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 823 score: 0.8927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 824 score: 0.9239 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 825 score: 0.8804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 826 score: 0.8827 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 827 score: 0.9241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 828 score: 0.8860 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 829 score: 0.8605 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 830 score: 0.8955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 831 score: 0.8228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 832 score: 0.8750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 833 score: 0.7899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 834 score: 0.8343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 835 score: 0.8641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 836 score: 0.6000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 837 score: 0.7398 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 838 score: 0.8866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 839 score: 0.9001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 840 score: 0.8961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 841 score: 0.8319 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 842 score: 0.5826 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 843 score: 0.8772 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 844 score: 0.7427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 845 score: 0.5798 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 846 score: 0.6791 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 847 score: 0.8646 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 848 score: 0.8989 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 849 score: 0.8294 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 850 score: 0.7803 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 851 score: 0.8206 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 852 score: 0.9434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 853 score: 0.8145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 854 score: 0.7885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 855 score: 0.8264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 856 score: 0.7805 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 857 score: 0.9174 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 858 score: 0.8999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 859 score: 0.8656 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 860 score: 0.8992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 861 score: 0.8972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 862 score: 0.8917 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 863 score: 0.9264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 864 score: 0.8880 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 865 score: 0.8358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 866 score: 0.8930 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 867 score: 0.9039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 868 score: 0.9066 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 869 score: 0.8337 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 870 score: 0.8896 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 871 score: 0.9281 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 872 score: 0.8816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 873 score: 0.8325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 874 score: 0.9212 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 875 score: 0.8567 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 876 score: 0.8724 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 877 score: 0.8926 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 878 score: 0.9146 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 879 score: 0.8023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 880 score: 0.8337 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 881 score: 0.9535 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 882 score: 0.9480 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 883 score: 0.8611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 884 score: 0.7615 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 885 score: 0.9392 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 886 score: 0.9123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 887 score: 0.6265 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 888 score: 0.7185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 889 score: 0.8915 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 890 score: 0.7101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 891 score: 0.7918 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 892 score: 0.6347 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 893 score: 0.7629 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 894 score: 0.9160 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 895 score: 0.8715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 896 score: 0.9023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 897 score: 0.7245 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 898 score: 0.9507 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 899 score: 0.7775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 900 score: 0.7842 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 901 score: 0.9063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 902 score: 0.6370 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 903 score: 0.8725 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 904 score: 0.9230 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 905 score: 0.8694 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 906 score: 0.8927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 907 score: 0.9307 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 908 score: 0.8490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 909 score: 0.9402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 910 score: 0.7088 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 911 score: 0.8691 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 912 score: 0.9253 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 913 score: 0.8253 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 914 score: 0.8930 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 915 score: 0.8248 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 916 score: 0.9256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 917 score: 0.2210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 918 score: 0.9518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 919 score: 0.8935 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 920 score: 0.9256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 921 score: 0.9317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 922 score: 0.7285 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 923 score: 0.8717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 924 score: 0.9410 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 925 score: 0.8977 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 926 score: 0.9351 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 927 score: 0.8462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 928 score: 0.9032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 929 score: 0.8444 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 930 score: 0.9283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 931 score: 0.9001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 932 score: 0.7979 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 933 score: 0.8309 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 934 score: 0.7441 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 935 score: 0.7071 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 936 score: 0.9087 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 937 score: 0.9493 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 938 score: 0.9231 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 939 score: 0.8917 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 940 score: 0.9139 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 941 score: 0.9680 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 942 score: 0.9495 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 943 score: 0.9114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 944 score: 0.8961 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 945 score: 0.9169 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 946 score: 0.8960 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 947 score: 0.8929 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 948 score: 0.8792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 949 score: 0.9119 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 950 score: 0.8162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 951 score: 0.7500 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 952 score: 0.6618 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 953 score: 0.8844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 954 score: 0.6124 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 955 score: 0.9125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 956 score: 0.9173 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 957 score: 0.9187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 958 score: 0.8833 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 959 score: 0.9214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 960 score: 0.8485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 961 score: 0.8585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 962 score: 0.9143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 963 score: 0.8608 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 964 score: 0.8475 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 965 score: 0.7790 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 966 score: 0.8925 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 967 score: 0.7951 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 968 score: 0.7748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 969 score: 0.8189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 970 score: 0.8627 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 971 score: 0.8519 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 972 score: 0.8488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 973 score: 0.8660 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 974 score: 0.6764 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 975 score: 0.9302 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 976 score: 0.8159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 977 score: 0.7853 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 978 score: 0.9597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 979 score: 0.9003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 980 score: 0.8342 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 981 score: 0.8337 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 982 score: 0.9070 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 983 score: 0.7591 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 984 score: 0.8045 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 985 score: 0.8721 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 986 score: 0.9217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 987 score: 0.8673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 988 score: 0.8354 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 989 score: 0.5615 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 990 score: 0.9161 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 991 score: 0.6622 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 992 score: 0.9003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 993 score: 0.7970 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 994 score: 0.9164 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 995 score: 0.7936 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 996 score: 0.9431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 997 score: 0.9650 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 998 score: 0.8707 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 999 score: 0.7051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1000 score: 0.9399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1001 score: 0.7990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1002 score: 0.8222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1003 score: 0.3772 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1004 score: 0.9218 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1005 score: 0.9114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1006 score: 0.8643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1007 score: 0.8812 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1008 score: 0.9399 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1009 score: 0.8979 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1010 score: 0.9040 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu Segment 1011 score: 0.8828 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-hu-max-tokens-512/test-en-hu score: 0.8623