diff --git "a/test-en-ar.comet" "b/test-en-ar.comet" new file mode 100644--- /dev/null +++ "b/test-en-ar.comet" @@ -0,0 +1,1013 @@ +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 0 score: 0.7384 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1 score: 0.8492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 2 score: 0.8380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 3 score: 0.8204 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 4 score: 0.8222 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 5 score: 0.5877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 6 score: 0.7033 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 7 score: 0.8887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 8 score: 0.8329 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 9 score: 0.6865 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 10 score: 0.7354 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 11 score: 0.6253 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 12 score: 0.6925 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 13 score: 0.8381 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 14 score: 0.7211 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 15 score: 0.6428 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 16 score: 0.7528 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 17 score: 0.8388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 18 score: 0.8214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 19 score: 0.7647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 20 score: 0.8038 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 21 score: 0.8269 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 22 score: 0.6319 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 23 score: 0.6483 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 24 score: 0.8770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 25 score: 0.9064 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 26 score: 0.6142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 27 score: 0.6679 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 28 score: 0.7207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 29 score: 0.6068 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 30 score: 0.6489 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 31 score: 0.5588 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 32 score: 0.6600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 33 score: 0.8883 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 34 score: 0.9154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 35 score: 0.9010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 36 score: 0.7887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 37 score: 0.6652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 38 score: 0.6074 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 39 score: 0.6425 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 40 score: 0.7637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 41 score: 0.8387 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 42 score: 0.6607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 43 score: 0.8650 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 44 score: 0.5917 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 45 score: 0.8302 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 46 score: 0.7398 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 47 score: 0.8093 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 48 score: 0.5017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 49 score: 0.8197 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 50 score: 0.8573 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 51 score: 0.8358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 52 score: 0.8629 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 53 score: 0.8687 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 54 score: 0.8411 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 55 score: 0.7663 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 56 score: 0.6417 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 57 score: 0.7467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 58 score: 0.8275 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 59 score: 0.9567 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 60 score: 0.8570 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 61 score: 0.8632 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 62 score: 0.8602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 63 score: 0.7657 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 64 score: 0.6764 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 65 score: 0.6191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 66 score: 0.4457 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 67 score: 0.5168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 68 score: 0.8866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 69 score: 0.8801 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 70 score: 0.8786 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 71 score: 0.8237 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 72 score: 0.8225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 73 score: 0.7141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 74 score: 0.8513 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 75 score: 0.7510 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 76 score: 0.8508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 77 score: 0.8919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 78 score: 0.9061 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 79 score: 0.8717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 80 score: 0.8330 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 81 score: 0.8448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 82 score: 0.6638 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 83 score: 0.6842 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 84 score: 0.7681 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 85 score: 0.8408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 86 score: 0.7080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 87 score: 0.8770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 88 score: 0.6867 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 89 score: 0.5417 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 90 score: 0.5966 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 91 score: 0.7467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 92 score: 0.7184 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 93 score: 0.6844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 94 score: 0.8193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 95 score: 0.6740 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 96 score: 0.3103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 97 score: 0.7539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 98 score: 0.5952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 99 score: 0.6875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 100 score: 0.7731 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 101 score: 0.6131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 102 score: 0.7151 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 103 score: 0.9273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 104 score: 0.8657 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 105 score: 0.5662 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 106 score: 0.7987 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 107 score: 0.8086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 108 score: 0.7165 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 109 score: 0.2314 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 110 score: 0.7816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 111 score: 0.9327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 112 score: 0.9425 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 113 score: 0.8835 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 114 score: 0.6234 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 115 score: 0.6958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 116 score: 0.7500 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 117 score: 0.6733 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 118 score: 0.8782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 119 score: 0.6089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 120 score: 0.6780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 121 score: 0.7518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 122 score: 0.8915 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 123 score: 0.8973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 124 score: 0.8193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 125 score: 0.7876 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 126 score: 0.8999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 127 score: 0.6404 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 128 score: 0.8347 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 129 score: 0.6121 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 130 score: 0.8625 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 131 score: 0.6966 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 132 score: 0.7280 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 133 score: 0.8398 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 134 score: 0.7160 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 135 score: 0.7582 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 136 score: 0.6139 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 137 score: 0.7179 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 138 score: 0.6680 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 139 score: 0.8569 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 140 score: 0.3741 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 141 score: 0.8803 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 142 score: 0.9284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 143 score: 0.7634 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 144 score: 0.8159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 145 score: 0.8588 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 146 score: 0.8821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 147 score: 0.8333 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 148 score: 0.7609 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 149 score: 0.7543 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 150 score: 0.8136 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 151 score: 0.7136 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 152 score: 0.5118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 153 score: 0.7604 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 154 score: 0.5402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 155 score: 0.7564 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 156 score: 0.7736 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 157 score: 0.7661 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 158 score: 0.6637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 159 score: 0.6068 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 160 score: 0.7407 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 161 score: 0.6909 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 162 score: 0.7642 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 163 score: 0.7397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 164 score: 0.7201 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 165 score: 0.7577 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 166 score: 0.8831 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 167 score: 0.7593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 168 score: 0.7282 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 169 score: 0.8058 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 170 score: 0.7041 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 171 score: 0.8229 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 172 score: 0.8332 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 173 score: 0.8122 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 174 score: 0.6681 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 175 score: 0.8098 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 176 score: 0.7682 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 177 score: 0.8355 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 178 score: 0.7547 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 179 score: 0.6506 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 180 score: 0.8535 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 181 score: 0.8752 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 182 score: 0.9108 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 183 score: 0.8535 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 184 score: 0.5780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 185 score: 0.9351 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 186 score: 0.9404 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 187 score: 0.6086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 188 score: 0.7697 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 189 score: 0.7377 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 190 score: 0.6365 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 191 score: 0.7542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 192 score: 0.7016 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 193 score: 0.6862 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 194 score: 0.7364 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 195 score: 0.7776 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 196 score: 0.8153 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 197 score: 0.6558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 198 score: 0.5636 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 199 score: 0.6355 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 200 score: 0.7756 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 201 score: 0.8178 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 202 score: 0.6992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 203 score: 0.5035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 204 score: 0.7674 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 205 score: 0.8005 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 206 score: 0.8706 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 207 score: 0.7577 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 208 score: 0.7467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 209 score: 0.7987 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 210 score: 0.8838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 211 score: 0.7508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 212 score: 0.6360 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 213 score: 0.6293 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 214 score: 0.8876 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 215 score: 0.8553 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 216 score: 0.8408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 217 score: 0.7201 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 218 score: 0.8159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 219 score: 0.8520 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 220 score: 0.9125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 221 score: 0.7940 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 222 score: 0.8091 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 223 score: 0.6951 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 224 score: 0.8583 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 225 score: 0.6756 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 226 score: 0.8721 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 227 score: 0.4272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 228 score: 0.7253 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 229 score: 0.8745 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 230 score: 0.9167 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 231 score: 0.5187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 232 score: 0.7217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 233 score: 0.6470 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 234 score: 0.7143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 235 score: 0.4198 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 236 score: 0.6715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 237 score: 0.5798 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 238 score: 0.8615 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 239 score: 0.8355 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 240 score: 0.7069 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 241 score: 0.5635 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 242 score: 0.7734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 243 score: 0.7943 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 244 score: 0.7397 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 245 score: 0.7522 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 246 score: 0.6960 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 247 score: 0.3926 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 248 score: 0.6533 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 249 score: 0.8708 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 250 score: 0.8345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 251 score: 0.9039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 252 score: 0.9177 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 253 score: 0.9281 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 254 score: 0.8425 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 255 score: 0.8614 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 256 score: 0.6724 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 257 score: 0.2910 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 258 score: 0.7654 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 259 score: 0.6757 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 260 score: 0.6958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 261 score: 0.8036 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 262 score: 0.9274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 263 score: 0.8852 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 264 score: 0.7329 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 265 score: 0.7249 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 266 score: 0.8194 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 267 score: 0.7632 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 268 score: 0.8944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 269 score: 0.5879 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 270 score: 0.6585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 271 score: 0.5933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 272 score: 0.8689 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 273 score: 0.3406 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 274 score: 0.6500 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 275 score: 0.6833 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 276 score: 0.6693 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 277 score: 0.8435 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 278 score: 0.7488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 279 score: 0.8919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 280 score: 0.7848 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 281 score: 0.9279 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 282 score: 0.8821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 283 score: 0.7146 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 284 score: 0.8195 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 285 score: 0.9471 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 286 score: 0.8348 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 287 score: 0.6811 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 288 score: 0.7853 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 289 score: 0.8219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 290 score: 0.7225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 291 score: 0.8454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 292 score: 0.8715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 293 score: 0.7192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 294 score: 0.7721 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 295 score: 0.7465 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 296 score: 0.7185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 297 score: 0.8708 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 298 score: 0.4374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 299 score: 0.9003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 300 score: 0.8850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 301 score: 0.7621 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 302 score: 0.7559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 303 score: 0.9000 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 304 score: 0.8008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 305 score: 0.7129 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 306 score: 0.8488 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 307 score: 0.8794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 308 score: 0.7804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 309 score: 0.8263 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 310 score: 0.7554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 311 score: 0.8953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 312 score: 0.5242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 313 score: 0.5909 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 314 score: 0.9156 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 315 score: 0.8814 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 316 score: 0.6416 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 317 score: 0.8158 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 318 score: 0.6305 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 319 score: 0.4391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 320 score: 0.2779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 321 score: 0.2203 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 322 score: 0.7570 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 323 score: 0.9226 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 324 score: 0.6895 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 325 score: 0.8509 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 326 score: 0.7064 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 327 score: 0.6210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 328 score: 0.8737 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 329 score: 0.9144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 330 score: 0.7989 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 331 score: 0.8396 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 332 score: 0.7820 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 333 score: 0.8490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 334 score: 0.8631 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 335 score: 0.7929 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 336 score: 0.6759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 337 score: 0.7032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 338 score: 0.6087 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 339 score: 0.8989 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 340 score: 0.4938 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 341 score: 0.8104 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 342 score: 0.5500 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 343 score: 0.3743 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 344 score: 0.7607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 345 score: 0.4683 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 346 score: 0.6887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 347 score: 0.7325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 348 score: 0.5279 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 349 score: 0.5439 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 350 score: 0.7866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 351 score: 0.7482 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 352 score: 0.7060 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 353 score: 0.7560 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 354 score: 0.7384 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 355 score: 0.7166 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 356 score: 0.7166 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 357 score: 0.6748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 358 score: 0.9396 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 359 score: 0.3273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 360 score: 0.6418 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 361 score: 0.5707 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 362 score: 0.8125 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 363 score: 0.5612 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 364 score: 0.8208 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 365 score: 0.5333 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 366 score: 0.6312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 367 score: 0.5427 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 368 score: 0.6561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 369 score: 0.6934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 370 score: 0.6985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 371 score: 0.6056 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 372 score: 0.7123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 373 score: 0.8431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 374 score: 0.8423 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 375 score: 0.7316 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 376 score: 0.6505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 377 score: 0.7037 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 378 score: 0.6693 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 379 score: 0.6901 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 380 score: 0.8675 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 381 score: 0.4809 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 382 score: 0.5825 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 383 score: 0.6274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 384 score: 0.6585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 385 score: 0.7611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 386 score: 0.7264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 387 score: 0.6686 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 388 score: 0.6543 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 389 score: 0.7418 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 390 score: 0.6164 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 391 score: 0.7623 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 392 score: 0.8405 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 393 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 394 score: 0.6733 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 395 score: 0.8433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 396 score: 0.7388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 397 score: 0.7079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 398 score: 0.6388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 399 score: 0.6597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 400 score: 0.7613 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 401 score: 0.8472 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 402 score: 0.8485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 403 score: 0.4135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 404 score: 0.7106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 405 score: 0.6992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 406 score: 0.8118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 407 score: 0.7097 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 408 score: 0.7807 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 409 score: 0.8099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 410 score: 0.7780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 411 score: 0.7652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 412 score: 0.6684 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 413 score: 0.2898 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 414 score: 0.8249 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 415 score: 0.8833 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 416 score: 0.8190 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 417 score: 0.6718 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 418 score: 0.7693 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 419 score: 0.8117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 420 score: 0.9010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 421 score: 0.8985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 422 score: 0.7449 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 423 score: 0.7281 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 424 score: 0.7986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 425 score: 0.8705 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 426 score: 0.8247 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 427 score: 0.7920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 428 score: 0.8920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 429 score: 0.8321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 430 score: 0.8076 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 431 score: 0.5714 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 432 score: 0.6571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 433 score: 0.7634 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 434 score: 0.5792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 435 score: 0.5443 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 436 score: 0.8080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 437 score: 0.6113 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 438 score: 0.9061 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 439 score: 0.5995 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 440 score: 0.8312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 441 score: 0.7955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 442 score: 0.8836 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 443 score: 0.7566 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 444 score: 0.7265 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 445 score: 0.7157 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 446 score: 0.7716 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 447 score: 0.8576 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 448 score: 0.9496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 449 score: 0.8842 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 450 score: 0.8617 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 451 score: 0.7304 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 452 score: 0.8920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 453 score: 0.8622 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 454 score: 0.8530 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 455 score: 0.6868 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 456 score: 0.6837 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 457 score: 0.8362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 458 score: 0.7224 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 459 score: 0.5600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 460 score: 0.2374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 461 score: 0.3111 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 462 score: 0.8501 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 463 score: 0.6464 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 464 score: 0.6075 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 465 score: 0.7901 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 466 score: 0.8216 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 467 score: 0.5378 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 468 score: 0.5309 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 469 score: 0.2780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 470 score: 0.7640 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 471 score: 0.7189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 472 score: 0.7569 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 473 score: 0.7635 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 474 score: 0.6215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 475 score: 0.8156 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 476 score: 0.2840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 477 score: 0.9201 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 478 score: 0.5793 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 479 score: 0.7985 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 480 score: 0.7804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 481 score: 0.3513 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 482 score: 0.6702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 483 score: 0.6652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 484 score: 0.3787 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 485 score: 0.8001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 486 score: 0.7651 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 487 score: 0.7884 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 488 score: 0.8347 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 489 score: 0.7497 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 490 score: 0.7101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 491 score: 0.6720 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 492 score: 0.7143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 493 score: 0.8029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 494 score: 0.8754 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 495 score: 0.7546 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 496 score: 0.6663 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 497 score: 0.6564 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 498 score: 0.7641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 499 score: 0.5279 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 500 score: 0.8922 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 501 score: 0.8240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 502 score: 0.7170 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 503 score: 0.6633 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 504 score: 0.6794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 505 score: 0.5788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 506 score: 0.6281 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 507 score: 0.7212 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 508 score: 0.7905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 509 score: 0.8604 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 510 score: 0.5562 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 511 score: 0.6583 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 512 score: 0.7614 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 513 score: 0.7023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 514 score: 0.8717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 515 score: 0.7752 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 516 score: 0.6615 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 517 score: 0.8892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 518 score: 0.8631 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 519 score: 0.8545 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 520 score: 0.7815 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 521 score: 0.8651 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 522 score: 0.8489 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 523 score: 0.2433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 524 score: 0.7132 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 525 score: 0.7619 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 526 score: 0.5299 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 527 score: 0.2428 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 528 score: 0.5895 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 529 score: 0.9141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 530 score: 0.5863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 531 score: 0.3544 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 532 score: 0.5968 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 533 score: 0.7977 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 534 score: 0.6601 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 535 score: 0.7086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 536 score: 0.3590 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 537 score: 0.7289 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 538 score: 0.8744 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 539 score: 0.6703 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 540 score: 0.8191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 541 score: 0.8419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 542 score: 0.6180 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 543 score: 0.6605 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 544 score: 0.7844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 545 score: 0.9622 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 546 score: 0.8211 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 547 score: 0.7355 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 548 score: 0.6926 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 549 score: 0.7574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 550 score: 0.7241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 551 score: 0.9012 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 552 score: 0.6916 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 553 score: 0.6252 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 554 score: 0.8426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 555 score: 0.7915 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 556 score: 0.5658 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 557 score: 0.8956 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 558 score: 0.3925 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 559 score: 0.7334 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 560 score: 0.7035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 561 score: 0.8644 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 562 score: 0.7911 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 563 score: 0.7219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 564 score: 0.6929 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 565 score: 0.8749 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 566 score: 0.7205 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 567 score: 0.8795 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 568 score: 0.7865 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 569 score: 0.6858 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 570 score: 0.9062 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 571 score: 0.8510 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 572 score: 0.6012 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 573 score: 0.6437 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 574 score: 0.8061 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 575 score: 0.7914 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 576 score: 0.4119 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 577 score: 0.6461 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 578 score: 0.8327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 579 score: 0.7209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 580 score: 0.8004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 581 score: 0.5980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 582 score: 0.8770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 583 score: 0.5582 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 584 score: 0.5432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 585 score: 0.7844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 586 score: 0.7409 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 587 score: 0.7378 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 588 score: 0.6806 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 589 score: 0.8375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 590 score: 0.6869 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 591 score: 0.8263 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 592 score: 0.7875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 593 score: 0.8729 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 594 score: 0.8698 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 595 score: 0.7362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 596 score: 0.7235 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 597 score: 0.6646 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 598 score: 0.5927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 599 score: 0.6279 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 600 score: 0.6043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 601 score: 0.6336 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 602 score: 0.3273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 603 score: 0.7323 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 604 score: 0.5951 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 605 score: 0.7593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 606 score: 0.6724 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 607 score: 0.7395 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 608 score: 0.7093 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 609 score: 0.2191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 610 score: 0.7162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 611 score: 0.8164 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 612 score: 0.8283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 613 score: 0.7605 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 614 score: 0.5890 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 615 score: 0.5614 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 616 score: 0.7976 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 617 score: 0.9431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 618 score: 0.8218 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 619 score: 0.2945 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 620 score: 0.7128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 621 score: 0.4950 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 622 score: 0.8542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 623 score: 0.8476 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 624 score: 0.7944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 625 score: 0.8067 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 626 score: 0.8755 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 627 score: 0.6101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 628 score: 0.9452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 629 score: 0.7217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 630 score: 0.6973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 631 score: 0.9151 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 632 score: 0.6707 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 633 score: 0.8975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 634 score: 0.8562 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 635 score: 0.8644 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 636 score: 0.7358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 637 score: 0.5905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 638 score: 0.6582 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 639 score: 0.9217 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 640 score: 0.8502 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 641 score: 0.8382 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 642 score: 0.5237 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 643 score: 0.6529 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 644 score: 0.5292 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 645 score: 0.7010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 646 score: 0.5702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 647 score: 0.8494 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 648 score: 0.6161 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 649 score: 0.5952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 650 score: 0.7496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 651 score: 0.8382 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 652 score: 0.5885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 653 score: 0.6471 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 654 score: 0.7556 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 655 score: 0.7830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 656 score: 0.8567 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 657 score: 0.7342 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 658 score: 0.5240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 659 score: 0.6156 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 660 score: 0.6435 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 661 score: 0.8553 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 662 score: 0.8918 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 663 score: 0.8200 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 664 score: 0.7943 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 665 score: 0.7321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 666 score: 0.3064 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 667 score: 0.8724 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 668 score: 0.8192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 669 score: 0.8734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 670 score: 0.2637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 671 score: 0.8515 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 672 score: 0.8819 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 673 score: 0.6074 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 674 score: 0.7665 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 675 score: 0.7388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 676 score: 0.7145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 677 score: 0.8439 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 678 score: 0.7825 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 679 score: 0.7382 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 680 score: 0.8304 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 681 score: 0.9035 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 682 score: 0.8627 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 683 score: 0.7204 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 684 score: 0.8157 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 685 score: 0.7302 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 686 score: 0.8750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 687 score: 0.7633 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 688 score: 0.7127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 689 score: 0.7538 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 690 score: 0.8437 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 691 score: 0.8424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 692 score: 0.8455 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 693 score: 0.6657 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 694 score: 0.6193 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 695 score: 0.7582 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 696 score: 0.7187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 697 score: 0.7702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 698 score: 0.6662 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 699 score: 0.9219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 700 score: 0.7671 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 701 score: 0.8552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 702 score: 0.8029 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 703 score: 0.6730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 704 score: 0.5807 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 705 score: 0.7200 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 706 score: 0.3112 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 707 score: 0.8669 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 708 score: 0.8262 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 709 score: 0.7888 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 710 score: 0.7759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 711 score: 0.6544 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 712 score: 0.9015 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 713 score: 0.7068 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 714 score: 0.8537 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 715 score: 0.8233 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 716 score: 0.8325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 717 score: 0.7009 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 718 score: 0.8199 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 719 score: 0.9045 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 720 score: 0.8082 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 721 score: 0.6570 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 722 score: 0.8320 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 723 score: 0.8142 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 724 score: 0.7369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 725 score: 0.6712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 726 score: 0.7402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 727 score: 0.8539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 728 score: 0.6256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 729 score: 0.7147 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 730 score: 0.8088 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 731 score: 0.8944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 732 score: 0.1810 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 733 score: 0.8212 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 734 score: 0.6624 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 735 score: 0.8674 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 736 score: 0.8551 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 737 score: 0.7942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 738 score: 0.9187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 739 score: 0.9144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 740 score: 0.8981 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 741 score: 0.8209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 742 score: 0.8098 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 743 score: 0.8982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 744 score: 0.6229 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 745 score: 0.5658 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 746 score: 0.8523 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 747 score: 0.2099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 748 score: 0.8022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 749 score: 0.9242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 750 score: 0.8498 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 751 score: 0.8513 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 752 score: 0.7844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 753 score: 0.8887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 754 score: 0.8982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 755 score: 0.8774 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 756 score: 0.8203 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 757 score: 0.7639 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 758 score: 0.8409 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 759 score: 0.7047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 760 score: 0.8792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 761 score: 0.6956 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 762 score: 0.6570 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 763 score: 0.8602 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 764 score: 0.8649 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 765 score: 0.5377 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 766 score: 0.7004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 767 score: 0.7780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 768 score: 0.8660 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 769 score: 0.8794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 770 score: 0.8365 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 771 score: 0.7094 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 772 score: 0.7706 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 773 score: 0.8098 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 774 score: 0.8954 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 775 score: 0.7571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 776 score: 0.7611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 777 score: 0.7253 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 778 score: 0.7575 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 779 score: 0.7395 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 780 score: 0.7214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 781 score: 0.8127 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 782 score: 0.6443 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 783 score: 0.7788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 784 score: 0.7263 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 785 score: 0.5410 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 786 score: 0.5994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 787 score: 0.7704 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 788 score: 0.5934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 789 score: 0.7369 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 790 score: 0.6948 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 791 score: 0.8451 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 792 score: 0.9044 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 793 score: 0.8672 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 794 score: 0.7515 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 795 score: 0.8487 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 796 score: 0.8191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 797 score: 0.6270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 798 score: 0.7518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 799 score: 0.7327 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 800 score: 0.7895 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 801 score: 0.6651 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 802 score: 0.2305 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 803 score: 0.7559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 804 score: 0.4994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 805 score: 0.6815 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 806 score: 0.7041 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 807 score: 0.6934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 808 score: 0.7502 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 809 score: 0.5733 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 810 score: 0.4652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 811 score: 0.3571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 812 score: 0.7715 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 813 score: 0.8243 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 814 score: 0.8106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 815 score: 0.7577 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 816 score: 0.8359 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 817 score: 0.4874 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 818 score: 0.6633 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 819 score: 0.5790 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 820 score: 0.7352 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 821 score: 0.5920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 822 score: 0.8670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 823 score: 0.8260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 824 score: 0.5213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 825 score: 0.5170 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 826 score: 0.6976 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 827 score: 0.7754 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 828 score: 0.6597 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 829 score: 0.6166 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 830 score: 0.7986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 831 score: 0.8031 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 832 score: 0.6970 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 833 score: 0.2214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 834 score: 0.5640 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 835 score: 0.6325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 836 score: 0.5402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 837 score: 0.6459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 838 score: 0.6639 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 839 score: 0.7332 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 840 score: 0.8574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 841 score: 0.3401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 842 score: 0.5089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 843 score: 0.6445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 844 score: 0.6415 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 845 score: 0.5625 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 846 score: 0.3328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 847 score: 0.7996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 848 score: 0.5845 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 849 score: 0.2145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 850 score: 0.6651 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 851 score: 0.8362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 852 score: 0.7882 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 853 score: 0.5281 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 854 score: 0.3897 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 855 score: 0.5233 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 856 score: 0.6916 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 857 score: 0.8296 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 858 score: 0.8254 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 859 score: 0.7357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 860 score: 0.8362 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 861 score: 0.7626 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 862 score: 0.8905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 863 score: 0.6764 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 864 score: 0.7711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 865 score: 0.7706 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 866 score: 0.8873 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 867 score: 0.6385 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 868 score: 0.8324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 869 score: 0.6992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 870 score: 0.8450 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 871 score: 0.7635 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 872 score: 0.6735 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 873 score: 0.8165 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 874 score: 0.8240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 875 score: 0.7987 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 876 score: 0.4214 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 877 score: 0.7764 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 878 score: 0.9179 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 879 score: 0.7158 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 880 score: 0.8886 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 881 score: 0.8318 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 882 score: 0.8676 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 883 score: 0.9026 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 884 score: 0.7759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 885 score: 0.5767 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 886 score: 0.8141 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 887 score: 0.5887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 888 score: 0.5192 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 889 score: 0.5637 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 890 score: 0.5563 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 891 score: 0.5171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 892 score: 0.6519 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 893 score: 0.6769 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 894 score: 0.6864 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 895 score: 0.9133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 896 score: 0.7880 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 897 score: 0.8599 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 898 score: 0.9051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 899 score: 0.7649 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 900 score: 0.7215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 901 score: 0.6969 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 902 score: 0.4933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 903 score: 0.6563 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 904 score: 0.8955 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 905 score: 0.2392 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 906 score: 0.7055 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 907 score: 0.7623 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 908 score: 0.7923 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 909 score: 0.7627 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 910 score: 0.6885 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 911 score: 0.8425 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 912 score: 0.8274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 913 score: 0.8216 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 914 score: 0.6561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 915 score: 0.7952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 916 score: 0.8282 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 917 score: 0.8932 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 918 score: 0.7571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 919 score: 0.7936 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 920 score: 0.6358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 921 score: 0.7525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 922 score: 0.8815 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 923 score: 0.8982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 924 score: 0.8274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 925 score: 0.8223 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 926 score: 0.8484 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 927 score: 0.7206 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 928 score: 0.8505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 929 score: 0.7677 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 930 score: 0.8535 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 931 score: 0.6412 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 932 score: 0.6023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 933 score: 0.7828 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 934 score: 0.6538 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 935 score: 0.2661 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 936 score: 0.3734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 937 score: 0.9514 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 938 score: 0.8859 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 939 score: 0.9071 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 940 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 941 score: 0.9600 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 942 score: 0.8716 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 943 score: 0.7666 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 944 score: 0.6980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 945 score: 0.8445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 946 score: 0.5426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 947 score: 0.8052 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 948 score: 0.7080 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 949 score: 0.7131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 950 score: 0.7357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 951 score: 0.8742 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 952 score: 0.6114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 953 score: 0.6406 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 954 score: 0.5316 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 955 score: 0.8934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 956 score: 0.7884 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 957 score: 0.9226 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 958 score: 0.8131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 959 score: 0.6656 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 960 score: 0.6460 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 961 score: 0.6277 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 962 score: 0.3456 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 963 score: 0.7563 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 964 score: 0.9259 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 965 score: 0.7947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 966 score: 0.6380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 967 score: 0.5460 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 968 score: 0.6900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 969 score: 0.6654 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 970 score: 0.6845 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 971 score: 0.6343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 972 score: 0.6515 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 973 score: 0.8542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 974 score: 0.7890 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 975 score: 0.5207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 976 score: 0.7468 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 977 score: 0.7349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 978 score: 0.7111 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 979 score: 0.8825 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 980 score: 0.8153 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 981 score: 0.8137 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 982 score: 0.8168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 983 score: 0.7678 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 984 score: 0.5281 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 985 score: 0.2508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 986 score: 0.4830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 987 score: 0.5917 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 988 score: 0.7347 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 989 score: 0.7339 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 990 score: 0.8862 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 991 score: 0.6325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 992 score: 0.8510 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 993 score: 0.8359 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 994 score: 0.7780 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 995 score: 0.7829 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 996 score: 0.5673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 997 score: 0.4822 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 998 score: 0.8877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 999 score: 0.5747 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1000 score: 0.7875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1001 score: 0.6407 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1002 score: 0.8243 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1003 score: 0.7244 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1004 score: 0.3924 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1005 score: 0.8881 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1006 score: 0.6561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1007 score: 0.5591 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1008 score: 0.5866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1009 score: 0.8081 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1010 score: 0.8442 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar Segment 1011 score: 0.8572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_50_languages/seperate_training//alma-13b-sft-50-languages-ar-max-tokens-512/test-en-ar score: 0.7300