diff --git "a/test-en-lv.comet" "b/test-en-lv.comet" new file mode 100644--- /dev/null +++ "b/test-en-lv.comet" @@ -0,0 +1,1013 @@ +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 0 score: 0.6505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1 score: 0.7756 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 2 score: 0.5581 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 3 score: 0.7493 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 4 score: 0.4659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 5 score: 0.5162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 6 score: 0.6491 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 7 score: 0.6916 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 8 score: 0.8673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 9 score: 0.5251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 10 score: 0.5259 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 11 score: 0.6359 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 12 score: 0.6571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 13 score: 0.3079 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 14 score: 0.7120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 15 score: 0.6424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 16 score: 0.3106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 17 score: 0.7110 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 18 score: 0.8250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 19 score: 0.4612 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 20 score: 0.9440 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 21 score: 0.6139 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 22 score: 0.5880 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 23 score: 0.7822 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 24 score: 0.6813 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 25 score: 0.7400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 26 score: 0.5157 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 27 score: 0.6810 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 28 score: 0.5014 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 29 score: 0.6021 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 30 score: 0.4866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 31 score: 0.6135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 32 score: 0.6994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 33 score: 0.8437 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 34 score: 0.8960 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 35 score: 0.8306 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 36 score: 0.7084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 37 score: 0.8258 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 38 score: 0.8189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 39 score: 0.5629 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 40 score: 0.4948 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 41 score: 0.9553 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 42 score: 0.7937 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 43 score: 0.8831 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 44 score: 0.5282 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 45 score: 0.5588 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 46 score: 0.8270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 47 score: 0.6106 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 48 score: 0.4476 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 49 score: 0.8247 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 50 score: 0.9423 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 51 score: 0.4684 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 52 score: 0.6505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 53 score: 0.6702 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 54 score: 0.7083 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 55 score: 0.7944 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 56 score: 0.7146 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 57 score: 0.6575 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 58 score: 0.7022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 59 score: 0.5739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 60 score: 0.6113 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 61 score: 0.7882 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 62 score: 0.7628 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 63 score: 0.6559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 64 score: 0.6657 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 65 score: 0.5151 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 66 score: 0.6774 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 67 score: 0.5266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 68 score: 0.7919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 69 score: 0.9123 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 70 score: 0.5590 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 71 score: 0.4400 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 72 score: 0.6894 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 73 score: 0.6298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 74 score: 0.8064 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 75 score: 0.7221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 76 score: 0.6131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 77 score: 0.5784 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 78 score: 0.8298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 79 score: 0.7695 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 80 score: 0.6741 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 81 score: 0.5898 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 82 score: 0.5942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 83 score: 0.4365 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 84 score: 0.4754 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 85 score: 0.5730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 86 score: 0.4290 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 87 score: 0.5721 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 88 score: 0.7990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 89 score: 0.6604 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 90 score: 0.5769 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 91 score: 0.7821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 92 score: 0.2884 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 93 score: 0.4964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 94 score: 0.4848 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 95 score: 0.8506 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 96 score: 0.4804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 97 score: 0.8788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 98 score: 0.7366 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 99 score: 0.8769 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 100 score: 0.9262 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 101 score: 0.7710 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 102 score: 0.7228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 103 score: 0.9431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 104 score: 0.6624 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 105 score: 0.7751 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 106 score: 0.8762 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 107 score: 0.6475 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 108 score: 0.4058 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 109 score: 0.5189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 110 score: 0.5266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 111 score: 0.5304 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 112 score: 0.8284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 113 score: 0.4567 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 114 score: 0.4669 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 115 score: 0.5475 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 116 score: 0.6587 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 117 score: 0.6481 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 118 score: 0.9089 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 119 score: 0.6410 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 120 score: 0.5625 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 121 score: 0.7606 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 122 score: 0.6594 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 123 score: 0.8759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 124 score: 0.5611 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 125 score: 0.5185 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 126 score: 0.8971 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 127 score: 0.4665 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 128 score: 0.5868 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 129 score: 0.2708 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 130 score: 0.4498 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 131 score: 0.5664 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 132 score: 0.4751 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 133 score: 0.5617 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 134 score: 0.5632 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 135 score: 0.3863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 136 score: 0.4067 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 137 score: 0.6609 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 138 score: 0.7363 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 139 score: 0.4974 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 140 score: 0.7793 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 141 score: 0.5454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 142 score: 0.6670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 143 score: 0.6388 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 144 score: 0.7081 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 145 score: 0.6750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 146 score: 0.7552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 147 score: 0.8933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 148 score: 0.8023 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 149 score: 0.4759 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 150 score: 0.8948 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 151 score: 0.7028 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 152 score: 0.7403 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 153 score: 0.7020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 154 score: 0.2171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 155 score: 0.6957 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 156 score: 0.4655 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 157 score: 0.5487 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 158 score: 0.5874 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 159 score: 0.6221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 160 score: 0.3875 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 161 score: 0.6722 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 162 score: 0.4277 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 163 score: 0.2317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 164 score: 0.8578 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 165 score: 0.5328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 166 score: 0.3623 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 167 score: 0.5406 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 168 score: 0.4700 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 169 score: 0.5478 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 170 score: 0.6990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 171 score: 0.6983 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 172 score: 0.7015 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 173 score: 0.5552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 174 score: 0.7321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 175 score: 0.6779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 176 score: 0.7174 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 177 score: 0.6610 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 178 score: 0.5829 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 179 score: 0.7432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 180 score: 0.8900 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 181 score: 0.8929 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 182 score: 0.7970 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 183 score: 0.8927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 184 score: 0.4799 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 185 score: 0.6669 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 186 score: 0.7170 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 187 score: 0.9264 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 188 score: 0.6468 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 189 score: 0.5411 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 190 score: 0.6767 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 191 score: 0.6325 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 192 score: 0.6502 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 193 score: 0.7162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 194 score: 0.5658 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 195 score: 0.8607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 196 score: 0.5090 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 197 score: 0.6034 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 198 score: 0.4422 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 199 score: 0.6689 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 200 score: 0.4746 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 201 score: 0.5341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 202 score: 0.4345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 203 score: 0.3050 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 204 score: 0.4137 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 205 score: 0.7091 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 206 score: 0.5735 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 207 score: 0.5717 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 208 score: 0.6641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 209 score: 0.9434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 210 score: 0.6792 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 211 score: 0.7340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 212 score: 0.6653 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 213 score: 0.8374 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 214 score: 0.8670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 215 score: 0.6435 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 216 score: 0.7499 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 217 score: 0.6246 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 218 score: 0.6298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 219 score: 0.5586 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 220 score: 0.8966 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 221 score: 0.4111 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 222 score: 0.5750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 223 score: 0.4881 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 224 score: 0.4431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 225 score: 0.7137 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 226 score: 0.5223 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 227 score: 0.5994 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 228 score: 0.7304 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 229 score: 0.8949 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 230 score: 0.8892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 231 score: 0.6284 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 232 score: 0.7463 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 233 score: 0.9011 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 234 score: 0.5522 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 235 score: 0.7261 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 236 score: 0.7411 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 237 score: 0.7095 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 238 score: 0.7850 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 239 score: 0.7248 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 240 score: 0.4809 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 241 score: 0.4794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 242 score: 0.8485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 243 score: 0.4357 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 244 score: 0.4566 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 245 score: 0.5248 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 246 score: 0.5490 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 247 score: 0.4964 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 248 score: 0.3022 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 249 score: 0.9043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 250 score: 0.2234 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 251 score: 0.9432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 252 score: 0.5338 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 253 score: 0.2026 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 254 score: 0.6273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 255 score: 0.8446 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 256 score: 0.5665 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 257 score: 0.6295 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 258 score: 0.8607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 259 score: 0.5907 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 260 score: 0.7438 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 261 score: 0.6061 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 262 score: 0.3528 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 263 score: 0.4934 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 264 score: 0.7236 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 265 score: 0.3751 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 266 score: 0.6159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 267 score: 0.7251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 268 score: 0.8221 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 269 score: 0.8274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 270 score: 0.5552 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 271 score: 0.4215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 272 score: 0.8796 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 273 score: 0.5511 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 274 score: 0.4935 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 275 score: 0.6704 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 276 score: 0.4830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 277 score: 0.5322 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 278 score: 0.5195 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 279 score: 0.7772 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 280 score: 0.6670 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 281 score: 0.7856 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 282 score: 0.4785 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 283 score: 0.5622 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 284 score: 0.8824 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 285 score: 0.9321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 286 score: 0.5097 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 287 score: 0.5046 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 288 score: 0.7220 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 289 score: 0.5332 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 290 score: 0.5988 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 291 score: 0.7945 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 292 score: 0.5168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 293 score: 0.2883 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 294 score: 0.4647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 295 score: 0.6539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 296 score: 0.5416 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 297 score: 0.6919 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 298 score: 0.6750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 299 score: 0.8844 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 300 score: 0.7938 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 301 score: 0.8654 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 302 score: 0.4462 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 303 score: 0.8947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 304 score: 0.5999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 305 score: 0.8117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 306 score: 0.8523 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 307 score: 0.8491 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 308 score: 0.8833 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 309 score: 0.7796 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 310 score: 0.9220 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 311 score: 0.5240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 312 score: 0.6398 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 313 score: 0.5468 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 314 score: 0.4497 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 315 score: 0.9244 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 316 score: 0.5401 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 317 score: 0.6908 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 318 score: 0.7729 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 319 score: 0.6520 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 320 score: 0.6635 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 321 score: 0.6566 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 322 score: 0.4103 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 323 score: 0.2952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 324 score: 0.6234 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 325 score: 0.7522 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 326 score: 0.5492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 327 score: 0.5171 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 328 score: 0.6596 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 329 score: 0.5947 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 330 score: 0.5968 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 331 score: 0.8356 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 332 score: 0.5986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 333 score: 0.4130 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 334 score: 0.8452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 335 score: 0.5779 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 336 score: 0.6830 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 337 score: 0.5557 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 338 score: 0.6117 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 339 score: 0.7817 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 340 score: 0.2251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 341 score: 0.4840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 342 score: 0.3107 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 343 score: 0.4688 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 344 score: 0.5884 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 345 score: 0.5576 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 346 score: 0.6568 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 347 score: 0.7908 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 348 score: 0.3641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 349 score: 0.3784 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 350 score: 0.7523 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 351 score: 0.4804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 352 score: 0.6183 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 353 score: 0.7077 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 354 score: 0.7099 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 355 score: 0.5697 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 356 score: 0.6788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 357 score: 0.4610 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 358 score: 0.7901 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 359 score: 0.5366 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 360 score: 0.4189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 361 score: 0.5477 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 362 score: 0.5818 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 363 score: 0.4447 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 364 score: 0.5009 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 365 score: 0.4172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 366 score: 0.5249 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 367 score: 0.6004 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 368 score: 0.2257 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 369 score: 0.3213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 370 score: 0.4711 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 371 score: 0.4338 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 372 score: 0.5425 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 373 score: 0.6407 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 374 score: 0.8921 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 375 score: 0.4601 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 376 score: 0.8287 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 377 score: 0.8750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 378 score: 0.4700 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 379 score: 0.5039 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 380 score: 0.4394 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 381 score: 0.4052 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 382 score: 0.4624 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 383 score: 0.5936 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 384 score: 0.7229 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 385 score: 0.4867 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 386 score: 0.4709 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 387 score: 0.3981 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 388 score: 0.5113 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 389 score: 0.4984 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 390 score: 0.5620 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 391 score: 0.5143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 392 score: 0.4546 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 393 score: 0.4653 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 394 score: 0.4492 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 395 score: 0.8101 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 396 score: 0.4153 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 397 score: 0.6574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 398 score: 0.4585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 399 score: 0.3403 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 400 score: 0.8235 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 401 score: 0.7559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 402 score: 0.5821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 403 score: 0.5728 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 404 score: 0.4665 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 405 score: 0.8826 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 406 score: 0.6914 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 407 score: 0.6770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 408 score: 0.9340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 409 score: 0.6375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 410 score: 0.8010 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 411 score: 0.7546 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 412 score: 0.5154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 413 score: 0.8124 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 414 score: 0.5084 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 415 score: 0.6096 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 416 score: 0.8908 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 417 score: 0.5191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 418 score: 0.8380 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 419 score: 0.8713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 420 score: 0.8226 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 421 score: 0.9200 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 422 score: 0.5866 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 423 score: 0.8229 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 424 score: 0.6044 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 425 score: 0.8604 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 426 score: 0.8684 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 427 score: 0.8524 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 428 score: 0.5591 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 429 score: 0.9274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 430 score: 0.8352 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 431 score: 0.6526 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 432 score: 0.7251 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 433 score: 0.5673 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 434 score: 0.4653 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 435 score: 0.4649 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 436 score: 0.4775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 437 score: 0.7571 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 438 score: 0.6816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 439 score: 0.5184 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 440 score: 0.7693 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 441 score: 0.4420 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 442 score: 0.6847 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 443 score: 0.7002 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 444 score: 0.6087 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 445 score: 0.4782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 446 score: 0.6776 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 447 score: 0.5219 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 448 score: 0.8902 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 449 score: 0.5316 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 450 score: 0.4554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 451 score: 0.7372 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 452 score: 0.5345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 453 score: 0.5995 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 454 score: 0.8731 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 455 score: 0.8386 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 456 score: 0.4916 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 457 score: 0.5001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 458 score: 0.5550 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 459 score: 0.4402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 460 score: 0.4794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 461 score: 0.2700 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 462 score: 0.1954 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 463 score: 0.6902 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 464 score: 0.7209 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 465 score: 0.6774 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 466 score: 0.8408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 467 score: 0.4843 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 468 score: 0.4753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 469 score: 0.2827 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 470 score: 0.5950 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 471 score: 0.5821 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 472 score: 0.5201 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 473 score: 0.3419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 474 score: 0.4042 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 475 score: 0.5310 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 476 score: 0.7303 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 477 score: 0.1939 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 478 score: 0.6585 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 479 score: 0.2178 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 480 score: 0.4376 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 481 score: 0.5344 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 482 score: 0.6247 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 483 score: 0.8474 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 484 score: 0.7618 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 485 score: 0.5293 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 486 score: 0.8561 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 487 score: 0.5518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 488 score: 0.8006 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 489 score: 0.7676 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 490 score: 0.4913 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 491 score: 0.7081 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 492 score: 0.9230 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 493 score: 0.8634 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 494 score: 0.5738 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 495 score: 0.5032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 496 score: 0.6051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 497 score: 0.5836 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 498 score: 0.4753 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 499 score: 0.5255 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 500 score: 0.7355 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 501 score: 0.8473 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 502 score: 0.6782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 503 score: 0.5227 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 504 score: 0.5481 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 505 score: 0.3868 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 506 score: 0.4749 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 507 score: 0.4894 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 508 score: 0.5943 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 509 score: 0.6542 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 510 score: 0.4750 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 511 score: 0.3172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 512 score: 0.4659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 513 score: 0.6134 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 514 score: 0.7525 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 515 score: 0.6795 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 516 score: 0.6071 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 517 score: 0.9275 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 518 score: 0.6317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 519 score: 0.9282 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 520 score: 0.8001 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 521 score: 0.8550 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 522 score: 0.5006 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 523 score: 0.5424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 524 score: 0.3168 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 525 score: 0.6485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 526 score: 0.6102 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 527 score: 0.5653 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 528 score: 0.4198 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 529 score: 0.4862 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 530 score: 0.4190 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 531 score: 0.6467 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 532 score: 0.4026 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 533 score: 0.5179 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 534 score: 0.4290 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 535 score: 0.4608 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 536 score: 0.2200 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 537 score: 0.3794 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 538 score: 0.6018 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 539 score: 0.5321 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 540 score: 0.6816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 541 score: 0.8031 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 542 score: 0.6936 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 543 score: 0.7749 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 544 score: 0.7228 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 545 score: 0.5429 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 546 score: 0.6835 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 547 score: 0.6270 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 548 score: 0.5973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 549 score: 0.6402 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 550 score: 0.5927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 551 score: 0.8324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 552 score: 0.8436 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 553 score: 0.5343 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 554 score: 0.4572 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 555 score: 0.3367 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 556 score: 0.1426 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 557 score: 0.9256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 558 score: 0.4456 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 559 score: 0.3816 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 560 score: 0.4131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 561 score: 0.4993 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 562 score: 0.5613 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 563 score: 0.2713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 564 score: 0.5027 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 565 score: 0.6163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 566 score: 0.7706 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 567 score: 0.5505 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 568 score: 0.5315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 569 score: 0.7172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 570 score: 0.7083 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 571 score: 0.7354 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 572 score: 0.5036 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 573 score: 0.5921 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 574 score: 0.4811 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 575 score: 0.4419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 576 score: 0.4054 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 577 score: 0.6340 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 578 score: 0.7707 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 579 score: 0.4878 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 580 score: 0.5176 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 581 score: 0.6638 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 582 score: 0.7737 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 583 score: 0.5730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 584 score: 0.4317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 585 score: 0.6341 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 586 score: 0.6252 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 587 score: 0.9486 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 588 score: 0.6607 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 589 score: 0.9107 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 590 score: 0.7538 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 591 score: 0.8415 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 592 score: 0.6100 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 593 score: 0.9593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 594 score: 0.8800 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 595 score: 0.5261 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 596 score: 0.4386 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 597 score: 0.5496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 598 score: 0.3927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 599 score: 0.7846 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 600 score: 0.8349 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 601 score: 0.7275 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 602 score: 0.2890 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 603 score: 0.6114 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 604 score: 0.5176 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 605 score: 0.5032 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 606 score: 0.7053 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 607 score: 0.5733 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 608 score: 0.7130 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 609 score: 0.6036 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 610 score: 0.5933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 611 score: 0.5043 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 612 score: 0.6240 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 613 score: 0.6563 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 614 score: 0.4689 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 615 score: 0.4189 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 616 score: 0.7131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 617 score: 0.8072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 618 score: 0.5256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 619 score: 0.5457 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 620 score: 0.5090 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 621 score: 0.5116 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 622 score: 0.4928 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 623 score: 0.4834 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 624 score: 0.2818 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 625 score: 0.5993 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 626 score: 0.5047 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 627 score: 0.8452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 628 score: 0.7385 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 629 score: 0.4527 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 630 score: 0.4998 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 631 score: 0.9138 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 632 score: 0.9331 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 633 score: 0.8719 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 634 score: 0.9723 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 635 score: 0.6078 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 636 score: 0.6606 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 637 score: 0.6135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 638 score: 0.7130 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 639 score: 0.7739 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 640 score: 0.6435 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 641 score: 0.7508 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 642 score: 0.4942 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 643 score: 0.5183 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 644 score: 0.5048 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 645 score: 0.6408 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 646 score: 0.6534 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 647 score: 0.7485 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 648 score: 0.4550 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 649 score: 0.5958 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 650 score: 0.4444 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 651 score: 0.4726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 652 score: 0.3603 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 653 score: 0.4050 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 654 score: 0.5740 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 655 score: 0.6385 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 656 score: 0.4728 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 657 score: 0.7086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 658 score: 0.3471 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 659 score: 0.1948 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 660 score: 0.4823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 661 score: 0.8774 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 662 score: 0.4441 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 663 score: 0.7421 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 664 score: 0.8793 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 665 score: 0.7941 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 666 score: 0.7952 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 667 score: 0.6272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 668 score: 0.5652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 669 score: 0.7256 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 670 score: 0.8881 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 671 score: 0.6999 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 672 score: 0.8224 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 673 score: 0.5903 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 674 score: 0.4239 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 675 score: 0.5608 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 676 score: 0.3050 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 677 score: 0.7227 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 678 score: 0.6706 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 679 score: 0.6272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 680 score: 0.5007 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 681 score: 0.5663 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 682 score: 0.8565 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 683 score: 0.5333 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 684 score: 0.5899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 685 score: 0.5775 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 686 score: 0.6298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 687 score: 0.5517 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 688 score: 0.6626 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 689 score: 0.5191 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 690 score: 0.4979 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 691 score: 0.8033 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 692 score: 0.6719 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 693 score: 0.3953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 694 score: 0.5641 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 695 score: 0.6021 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 696 score: 0.4432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 697 score: 0.6154 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 698 score: 0.5819 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 699 score: 0.8017 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 700 score: 0.8537 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 701 score: 0.9207 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 702 score: 0.7982 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 703 score: 0.4649 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 704 score: 0.4243 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 705 score: 0.2981 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 706 score: 0.4381 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 707 score: 0.5242 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 708 score: 0.7121 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 709 score: 0.6745 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 710 score: 0.8261 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 711 score: 0.6714 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 712 score: 0.8135 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 713 score: 0.7640 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 714 score: 0.6391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 715 score: 0.6137 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 716 score: 0.8044 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 717 score: 0.5330 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 718 score: 0.6059 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 719 score: 0.2788 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 720 score: 0.5391 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 721 score: 0.7241 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 722 score: 0.8088 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 723 score: 0.8432 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 724 score: 0.8647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 725 score: 0.2283 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 726 score: 0.6003 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 727 score: 0.6383 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 728 score: 0.4698 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 729 score: 0.4931 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 730 score: 0.7804 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 731 score: 0.7863 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 732 score: 0.6576 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 733 score: 0.9020 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 734 score: 0.6539 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 735 score: 0.9025 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 736 score: 0.6713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 737 score: 0.6145 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 738 score: 0.3864 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 739 score: 0.5331 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 740 score: 0.5156 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 741 score: 0.7072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 742 score: 0.6876 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 743 score: 0.8096 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 744 score: 0.7590 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 745 score: 0.6375 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 746 score: 0.5454 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 747 score: 0.5814 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 748 score: 0.7144 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 749 score: 0.9085 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 750 score: 0.9669 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 751 score: 0.7658 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 752 score: 0.6712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 753 score: 0.7481 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 754 score: 0.8936 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 755 score: 0.5546 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 756 score: 0.7419 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 757 score: 0.6693 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 758 score: 0.7183 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 759 score: 0.5622 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 760 score: 0.9559 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 761 score: 0.5271 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 762 score: 0.8812 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 763 score: 0.4972 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 764 score: 0.5198 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 765 score: 0.4975 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 766 score: 0.4329 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 767 score: 0.4195 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 768 score: 0.9550 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 769 score: 0.8249 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 770 score: 0.5543 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 771 score: 0.8085 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 772 score: 0.7920 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 773 score: 0.7567 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 774 score: 0.6317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 775 score: 0.5619 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 776 score: 0.5883 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 777 score: 0.7761 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 778 score: 0.6097 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 779 score: 0.7925 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 780 score: 0.5893 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 781 score: 0.6086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 782 score: 0.6649 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 783 score: 0.4933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 784 score: 0.6744 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 785 score: 0.5063 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 786 score: 0.5051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 787 score: 0.7556 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 788 score: 0.6345 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 789 score: 0.7109 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 790 score: 0.9163 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 791 score: 0.7181 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 792 score: 0.7897 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 793 score: 0.4726 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 794 score: 0.4716 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 795 score: 0.5754 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 796 score: 0.7646 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 797 score: 0.4869 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 798 score: 0.4665 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 799 score: 0.4319 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 800 score: 0.6128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 801 score: 0.6960 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 802 score: 0.5233 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 803 score: 0.3996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 804 score: 0.5210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 805 score: 0.4823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 806 score: 0.5659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 807 score: 0.4553 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 808 score: 0.6143 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 809 score: 0.5159 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 810 score: 0.8433 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 811 score: 0.7464 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 812 score: 0.9643 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 813 score: 0.8414 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 814 score: 0.5072 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 815 score: 0.6450 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 816 score: 0.8018 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 817 score: 0.4748 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 818 score: 0.4845 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 819 score: 0.3473 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 820 score: 0.6659 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 821 score: 0.6094 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 822 score: 0.7671 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 823 score: 0.6213 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 824 score: 0.3051 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 825 score: 0.5647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 826 score: 0.4663 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 827 score: 0.5172 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 828 score: 0.6086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 829 score: 0.4196 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 830 score: 0.4887 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 831 score: 0.6297 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 832 score: 0.5745 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 833 score: 0.4315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 834 score: 0.4712 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 835 score: 0.6133 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 836 score: 0.4716 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 837 score: 0.5328 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 838 score: 0.3996 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 839 score: 0.6734 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 840 score: 0.5187 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 841 score: 0.5110 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 842 score: 0.3132 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 843 score: 0.5245 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 844 score: 0.5092 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 845 score: 0.3069 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 846 score: 0.3510 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 847 score: 0.6184 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 848 score: 0.2550 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 849 score: 0.5009 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 850 score: 0.6445 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 851 score: 0.3574 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 852 score: 0.8186 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 853 score: 0.5581 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 854 score: 0.4809 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 855 score: 0.4906 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 856 score: 0.2040 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 857 score: 0.6272 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 858 score: 0.7772 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 859 score: 0.5166 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 860 score: 0.6434 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 861 score: 0.5980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 862 score: 0.5882 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 863 score: 0.6627 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 864 score: 0.6573 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 865 score: 0.4905 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 866 score: 0.6162 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 867 score: 0.6593 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 868 score: 0.7188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 869 score: 0.5992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 870 score: 0.7720 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 871 score: 0.8131 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 872 score: 0.5979 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 873 score: 0.4097 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 874 score: 0.6225 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 875 score: 0.3668 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 876 score: 0.5838 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 877 score: 0.8448 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 878 score: 0.9067 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 879 score: 0.4980 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 880 score: 0.8277 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 881 score: 0.5521 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 882 score: 0.7128 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 883 score: 0.5008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 884 score: 0.5259 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 885 score: 0.7379 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 886 score: 0.8274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 887 score: 0.5073 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 888 score: 0.3831 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 889 score: 0.4699 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 890 score: 0.4834 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 891 score: 0.4112 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 892 score: 0.4811 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 893 score: 0.5459 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 894 score: 0.6524 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 895 score: 0.5098 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 896 score: 0.4891 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 897 score: 0.6840 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 898 score: 0.8449 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 899 score: 0.5202 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 900 score: 0.4986 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 901 score: 0.6682 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 902 score: 0.6738 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 903 score: 0.7120 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 904 score: 0.8301 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 905 score: 0.2612 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 906 score: 0.6995 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 907 score: 0.4250 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 908 score: 0.7312 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 909 score: 0.6884 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 910 score: 0.3423 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 911 score: 0.5678 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 912 score: 0.6628 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 913 score: 0.6782 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 914 score: 0.8796 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 915 score: 0.2404 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 916 score: 0.4891 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 917 score: 0.5430 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 918 score: 0.8820 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 919 score: 0.6649 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 920 score: 0.3725 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 921 score: 0.8093 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 922 score: 0.4652 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 923 score: 0.6364 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 924 score: 0.7315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 925 score: 0.6768 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 926 score: 0.6718 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 927 score: 0.6468 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 928 score: 0.5392 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 929 score: 0.4008 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 930 score: 0.6773 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 931 score: 0.6452 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 932 score: 0.7302 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 933 score: 0.5791 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 934 score: 0.2440 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 935 score: 0.4497 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 936 score: 0.5195 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 937 score: 0.9311 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 938 score: 0.6394 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 939 score: 0.5298 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 940 score: 0.8554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 941 score: 0.9583 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 942 score: 0.7770 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 943 score: 0.5700 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 944 score: 0.6647 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 945 score: 0.5503 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 946 score: 0.5582 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 947 score: 0.2208 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 948 score: 0.5933 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 949 score: 0.6970 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 950 score: 0.7038 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 951 score: 0.8358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 952 score: 0.4317 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 953 score: 0.6086 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 954 score: 0.5529 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 955 score: 0.6883 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 956 score: 0.9266 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 957 score: 0.8877 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 958 score: 0.9118 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 959 score: 0.8140 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 960 score: 0.3134 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 961 score: 0.2823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 962 score: 0.5599 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 963 score: 0.5460 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 964 score: 0.5271 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 965 score: 0.5506 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 966 score: 0.3843 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 967 score: 0.2899 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 968 score: 0.3873 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 969 score: 0.3897 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 970 score: 0.4856 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 971 score: 0.4565 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 972 score: 0.4558 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 973 score: 0.5260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 974 score: 0.7015 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 975 score: 0.6929 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 976 score: 0.6518 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 977 score: 0.5990 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 978 score: 0.3710 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 979 score: 0.6215 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 980 score: 0.7973 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 981 score: 0.5315 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 982 score: 0.6713 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 983 score: 0.4787 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 984 score: 0.5783 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 985 score: 0.7953 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 986 score: 0.6273 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 987 score: 0.6358 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 988 score: 0.5188 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 989 score: 0.6210 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 990 score: 0.6364 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 991 score: 0.4730 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 992 score: 0.8153 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 993 score: 0.6070 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 994 score: 0.4892 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 995 score: 0.5938 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 996 score: 0.4431 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 997 score: 0.6672 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 998 score: 0.4727 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 999 score: 0.4424 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1000 score: 0.5854 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1001 score: 0.4855 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1002 score: 0.7823 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1003 score: 0.5496 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1004 score: 0.5927 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1005 score: 0.5260 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1006 score: 0.4992 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1007 score: 0.5182 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1008 score: 0.7761 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1009 score: 0.4554 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1010 score: 0.5324 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv Segment 1011 score: 0.8274 +/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages//alma-13b-sft-16-languages-lv-max-tokens-512/test-en-lv score: 0.6162