TongZheng1999's picture
Upload folder using huggingface_hub
0e41f85 verified
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 0 score: 0.7249
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1 score: 0.9216
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 2 score: 0.9079
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 3 score: 0.8298
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 4 score: 0.8325
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 5 score: 0.8385
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 6 score: 0.7970
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 7 score: 0.8654
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 8 score: 0.8976
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 9 score: 0.8055
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 10 score: 0.8492
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 11 score: 0.8505
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 12 score: 0.8500
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 13 score: 0.8292
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 14 score: 0.8304
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 15 score: 0.7146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 16 score: 0.8315
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 17 score: 0.9198
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 18 score: 0.9290
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 19 score: 0.8890
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 20 score: 0.9357
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 21 score: 0.8638
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 22 score: 0.7485
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 23 score: 0.9142
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 24 score: 0.9308
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 25 score: 0.9685
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 26 score: 0.8620
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 27 score: 0.8075
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 28 score: 0.7720
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 29 score: 0.8967
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 30 score: 0.8117
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 31 score: 0.8246
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 32 score: 0.8887
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 33 score: 0.9300
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 34 score: 0.9363
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 35 score: 0.9501
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 36 score: 0.8295
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 37 score: 0.8901
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 38 score: 0.6796
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 39 score: 0.9395
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 40 score: 0.8455
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 41 score: 0.9567
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 42 score: 0.9045
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 43 score: 0.9037
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 44 score: 0.8185
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 45 score: 0.9014
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 46 score: 0.9013
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 47 score: 0.8428
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 48 score: 0.7499
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 49 score: 0.8707
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 50 score: 0.9260
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 51 score: 0.6967
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 52 score: 0.9008
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 53 score: 0.9320
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 54 score: 0.8764
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 55 score: 0.8331
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 56 score: 0.8996
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 57 score: 0.8322
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 58 score: 0.7636
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 59 score: 0.9240
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 60 score: 0.8437
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 61 score: 0.9229
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 62 score: 0.8250
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 63 score: 0.9062
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 64 score: 0.8695
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 65 score: 0.8134
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 66 score: 0.6961
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 67 score: 0.7315
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 68 score: 0.9105
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 69 score: 0.9047
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 70 score: 0.8702
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 71 score: 0.8514
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 72 score: 0.8451
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 73 score: 0.8852
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 74 score: 0.9051
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 75 score: 0.8963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 76 score: 0.8996
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 77 score: 0.8820
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 78 score: 0.8865
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 79 score: 0.7027
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 80 score: 0.8870
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 81 score: 0.8892
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 82 score: 0.7625
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 83 score: 0.7115
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 84 score: 0.6901
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 85 score: 0.8814
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 86 score: 0.8031
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 87 score: 0.8557
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 88 score: 0.8882
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 89 score: 0.8392
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 90 score: 0.6267
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 91 score: 0.8389
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 92 score: 0.8809
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 93 score: 0.8335
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 94 score: 0.8326
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 95 score: 0.9144
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 96 score: 0.7093
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 97 score: 0.8504
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 98 score: 0.8935
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 99 score: 0.7952
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 100 score: 0.8948
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 101 score: 0.8511
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 102 score: 0.8807
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 103 score: 0.8755
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 104 score: 0.9002
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 105 score: 0.7995
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 106 score: 0.8803
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 107 score: 0.9100
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 108 score: 0.6467
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 109 score: 0.8498
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 110 score: 0.7659
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 111 score: 0.9460
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 112 score: 0.9548
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 113 score: 0.9490
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 114 score: 0.8146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 115 score: 0.8567
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 116 score: 0.8979
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 117 score: 0.9089
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 118 score: 0.8202
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 119 score: 0.8596
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 120 score: 0.8691
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 121 score: 0.8816
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 122 score: 0.9390
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 123 score: 0.9504
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 124 score: 0.9076
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 125 score: 0.9277
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 126 score: 0.8677
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 127 score: 0.9014
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 128 score: 0.7566
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 129 score: 0.9022
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 130 score: 0.9218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 131 score: 0.6541
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 132 score: 0.8859
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 133 score: 0.9039
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 134 score: 0.7635
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 135 score: 0.7793
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 136 score: 0.9347
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 137 score: 0.9009
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 138 score: 0.9180
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 139 score: 0.8128
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 140 score: 0.8563
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 141 score: 0.9294
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 142 score: 0.9473
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 143 score: 0.9037
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 144 score: 0.9702
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 145 score: 0.9324
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 146 score: 0.9364
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 147 score: 0.8765
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 148 score: 0.8415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 149 score: 0.9211
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 150 score: 0.8937
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 151 score: 0.7884
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 152 score: 0.8310
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 153 score: 0.7924
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 154 score: 0.6982
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 155 score: 0.9086
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 156 score: 0.8790
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 157 score: 0.8888
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 158 score: 0.8523
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 159 score: 0.8400
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 160 score: 0.9444
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 161 score: 0.8323
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 162 score: 0.6765
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 163 score: 0.7828
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 164 score: 0.8439
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 165 score: 0.7370
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 166 score: 0.8829
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 167 score: 0.8379
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 168 score: 0.8841
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 169 score: 0.8995
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 170 score: 0.8875
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 171 score: 0.9231
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 172 score: 0.9250
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 173 score: 0.8955
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 174 score: 0.8753
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 175 score: 0.8821
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 176 score: 0.8347
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 177 score: 0.8581
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 178 score: 0.9227
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 179 score: 0.9429
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 180 score: 0.9125
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 181 score: 0.8859
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 182 score: 0.9270
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 183 score: 0.9428
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 184 score: 0.8387
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 185 score: 0.9285
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 186 score: 0.9482
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 187 score: 0.8347
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 188 score: 0.8700
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 189 score: 0.8495
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 190 score: 0.7640
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 191 score: 0.8790
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 192 score: 0.7163
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 193 score: 0.7971
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 194 score: 0.7942
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 195 score: 0.9044
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 196 score: 0.8984
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 197 score: 0.8658
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 198 score: 0.8769
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 199 score: 0.8293
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 200 score: 0.7272
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 201 score: 0.6888
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 202 score: 0.7704
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 203 score: 0.6182
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 204 score: 0.7467
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 205 score: 0.8718
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 206 score: 0.9220
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 207 score: 0.8771
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 208 score: 0.8675
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 209 score: 0.9066
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 210 score: 0.9494
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 211 score: 0.9363
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 212 score: 0.9213
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 213 score: 0.8053
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 214 score: 0.8861
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 215 score: 0.9304
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 216 score: 0.8827
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 217 score: 0.9424
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 218 score: 0.9307
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 219 score: 0.8492
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 220 score: 0.9235
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 221 score: 0.6839
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 222 score: 0.8752
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 223 score: 0.8829
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 224 score: 0.9104
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 225 score: 0.7337
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 226 score: 0.9037
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 227 score: 0.8447
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 228 score: 0.9199
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 229 score: 0.9294
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 230 score: 0.9697
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 231 score: 0.8475
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 232 score: 0.8848
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 233 score: 0.9067
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 234 score: 0.8058
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 235 score: 0.9141
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 236 score: 0.8219
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 237 score: 0.8669
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 238 score: 0.9386
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 239 score: 0.8541
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 240 score: 0.7709
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 241 score: 0.8547
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 242 score: 0.9276
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 243 score: 0.8502
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 244 score: 0.7826
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 245 score: 0.9109
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 246 score: 0.7973
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 247 score: 0.8344
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 248 score: 0.7729
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 249 score: 0.9414
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 250 score: 0.9122
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 251 score: 0.9303
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 252 score: 0.9185
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 253 score: 0.8597
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 254 score: 0.9542
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 255 score: 0.9293
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 256 score: 0.8604
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 257 score: 0.9314
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 258 score: 0.8917
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 259 score: 0.8631
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 260 score: 0.9458
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 261 score: 0.7915
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 262 score: 0.8807
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 263 score: 0.7872
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 264 score: 0.8994
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 265 score: 0.8447
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 266 score: 0.9193
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 267 score: 0.8890
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 268 score: 0.9292
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 269 score: 0.8562
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 270 score: 0.8573
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 271 score: 0.8477
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 272 score: 0.9189
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 273 score: 0.8175
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 274 score: 0.7855
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 275 score: 0.8356
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 276 score: 0.8919
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 277 score: 0.8894
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 278 score: 0.8515
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 279 score: 0.9561
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 280 score: 0.9040
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 281 score: 0.9305
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 282 score: 0.9078
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 283 score: 0.8365
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 284 score: 0.9469
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 285 score: 0.9606
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 286 score: 0.7951
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 287 score: 0.8009
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 288 score: 0.8952
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 289 score: 0.8732
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 290 score: 0.8054
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 291 score: 0.8382
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 292 score: 0.8942
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 293 score: 0.9191
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 294 score: 0.7557
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 295 score: 0.8454
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 296 score: 0.8970
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 297 score: 0.6828
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 298 score: 0.9251
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 299 score: 0.9244
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 300 score: 0.8943
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 301 score: 0.8272
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 302 score: 0.8443
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 303 score: 0.9262
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 304 score: 0.8353
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 305 score: 0.7959
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 306 score: 0.9511
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 307 score: 0.8735
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 308 score: 0.8092
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 309 score: 0.8187
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 310 score: 0.9357
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 311 score: 0.8828
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 312 score: 0.9159
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 313 score: 0.7372
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 314 score: 0.9478
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 315 score: 0.9241
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 316 score: 0.8809
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 317 score: 0.8576
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 318 score: 0.7416
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 319 score: 0.8614
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 320 score: 0.8620
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 321 score: 0.7963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 322 score: 0.9075
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 323 score: 0.9047
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 324 score: 0.9082
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 325 score: 0.8865
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 326 score: 0.7974
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 327 score: 0.8789
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 328 score: 0.8911
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 329 score: 0.9146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 330 score: 0.9550
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 331 score: 0.7985
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 332 score: 0.9133
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 333 score: 0.8429
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 334 score: 0.9252
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 335 score: 0.8747
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 336 score: 0.9170
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 337 score: 0.8720
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 338 score: 0.9030
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 339 score: 0.9199
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 340 score: 0.7606
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 341 score: 0.8710
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 342 score: 0.8141
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 343 score: 0.8441
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 344 score: 0.8988
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 345 score: 0.7329
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 346 score: 0.9212
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 347 score: 0.9299
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 348 score: 0.7543
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 349 score: 0.8000
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 350 score: 0.8433
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 351 score: 0.8057
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 352 score: 0.8581
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 353 score: 0.8806
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 354 score: 0.8345
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 355 score: 0.9115
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 356 score: 0.9052
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 357 score: 0.9182
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 358 score: 0.9136
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 359 score: 0.7280
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 360 score: 0.8943
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 361 score: 0.9105
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 362 score: 0.8573
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 363 score: 0.6533
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 364 score: 0.8296
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 365 score: 0.8620
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 366 score: 0.7784
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 367 score: 0.8158
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 368 score: 0.8002
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 369 score: 0.8795
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 370 score: 0.6847
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 371 score: 0.7372
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 372 score: 0.9046
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 373 score: 0.9034
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 374 score: 0.9218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 375 score: 0.8977
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 376 score: 0.9176
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 377 score: 0.9370
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 378 score: 0.7719
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 379 score: 0.8711
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 380 score: 0.8744
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 381 score: 0.8597
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 382 score: 0.8034
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 383 score: 0.8500
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 384 score: 0.8989
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 385 score: 0.7672
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 386 score: 0.8237
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 387 score: 0.8795
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 388 score: 0.8342
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 389 score: 0.9081
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 390 score: 0.8386
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 391 score: 0.8442
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 392 score: 0.6989
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 393 score: 0.8831
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 394 score: 0.9334
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 395 score: 0.8253
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 396 score: 0.8749
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 397 score: 0.9137
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 398 score: 0.8339
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 399 score: 0.8534
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 400 score: 0.9501
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 401 score: 0.8421
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 402 score: 0.8960
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 403 score: 0.7298
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 404 score: 0.8340
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 405 score: 0.8423
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 406 score: 0.9073
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 407 score: 0.8710
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 408 score: 0.9458
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 409 score: 0.9153
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 410 score: 0.9146
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 411 score: 0.8252
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 412 score: 0.8029
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 413 score: 0.8978
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 414 score: 0.9253
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 415 score: 0.8930
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 416 score: 0.9464
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 417 score: 0.8294
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 418 score: 0.9237
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 419 score: 0.8511
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 420 score: 0.9380
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 421 score: 0.9326
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 422 score: 0.8962
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 423 score: 0.8145
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 424 score: 0.8713
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 425 score: 0.9299
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 426 score: 0.9409
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 427 score: 0.9336
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 428 score: 0.7756
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 429 score: 0.9158
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 430 score: 0.8785
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 431 score: 0.8662
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 432 score: 0.8854
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 433 score: 0.8370
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 434 score: 0.8537
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 435 score: 0.7078
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 436 score: 0.8844
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 437 score: 0.7300
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 438 score: 0.9358
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 439 score: 0.9108
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 440 score: 0.9157
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 441 score: 0.8901
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 442 score: 0.9151
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 443 score: 0.8870
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 444 score: 0.8235
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 445 score: 0.7637
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 446 score: 0.8335
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 447 score: 0.8962
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 448 score: 0.9484
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 449 score: 0.8879
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 450 score: 0.9000
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 451 score: 0.8552
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 452 score: 0.9113
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 453 score: 0.2193
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 454 score: 0.9188
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 455 score: 0.8279
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 456 score: 0.8124
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 457 score: 0.9380
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 458 score: 0.9101
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 459 score: 0.7308
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 460 score: 0.9158
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 461 score: 0.8369
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 462 score: 0.8868
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 463 score: 0.9459
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 464 score: 0.8032
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 465 score: 0.8593
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 466 score: 0.9389
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 467 score: 0.7310
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 468 score: 0.6750
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 469 score: 0.8642
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 470 score: 0.7519
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 471 score: 0.8244
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 472 score: 0.7263
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 473 score: 0.6637
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 474 score: 0.7227
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 475 score: 0.9342
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 476 score: 0.8715
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 477 score: 0.8965
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 478 score: 0.8844
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 479 score: 0.8723
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 480 score: 0.8805
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 481 score: 0.7516
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 482 score: 0.8888
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 483 score: 0.9023
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 484 score: 0.8924
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 485 score: 0.8736
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 486 score: 0.8750
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 487 score: 0.8440
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 488 score: 0.9242
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 489 score: 0.8682
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 490 score: 0.8674
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 491 score: 0.8352
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 492 score: 0.9365
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 493 score: 0.9307
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 494 score: 0.8874
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 495 score: 0.8436
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 496 score: 0.8462
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 497 score: 0.8039
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 498 score: 0.8690
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 499 score: 0.8964
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 500 score: 0.9167
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 501 score: 0.9167
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 502 score: 0.8090
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 503 score: 0.7818
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 504 score: 0.8442
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 505 score: 0.8744
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 506 score: 0.7020
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 507 score: 0.9104
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 508 score: 0.6400
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 509 score: 0.8501
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 510 score: 0.7111
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 511 score: 0.6744
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 512 score: 0.8791
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 513 score: 0.8288
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 514 score: 0.8827
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 515 score: 0.8320
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 516 score: 0.7570
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 517 score: 0.9097
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 518 score: 0.9490
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 519 score: 0.8678
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 520 score: 0.9339
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 521 score: 0.9208
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 522 score: 0.8513
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 523 score: 0.7272
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 524 score: 0.8754
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 525 score: 0.9134
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 526 score: 0.8480
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 527 score: 0.6666
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 528 score: 0.8515
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 529 score: 0.8511
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 530 score: 0.7957
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 531 score: 0.8587
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 532 score: 0.7646
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 533 score: 0.8411
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 534 score: 0.7764
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 535 score: 0.7383
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 536 score: 0.8751
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 537 score: 0.8804
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 538 score: 0.8089
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 539 score: 0.9044
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 540 score: 0.9182
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 541 score: 0.8985
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 542 score: 0.9105
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 543 score: 0.8287
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 544 score: 0.8846
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 545 score: 0.8404
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 546 score: 0.8389
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 547 score: 0.8843
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 548 score: 0.8483
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 549 score: 0.9169
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 550 score: 0.8415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 551 score: 0.8912
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 552 score: 0.8394
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 553 score: 0.8604
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 554 score: 0.8593
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 555 score: 0.7204
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 556 score: 0.8415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 557 score: 0.7614
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 558 score: 0.8301
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 559 score: 0.8114
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 560 score: 0.6507
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 561 score: 0.8968
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 562 score: 0.8960
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 563 score: 0.7686
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 564 score: 0.8828
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 565 score: 0.9034
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 566 score: 0.8961
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 567 score: 0.9169
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 568 score: 0.8554
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 569 score: 0.8668
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 570 score: 0.9081
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 571 score: 0.8335
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 572 score: 0.7831
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 573 score: 0.9291
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 574 score: 0.9289
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 575 score: 0.9415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 576 score: 0.6872
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 577 score: 0.8691
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 578 score: 0.9318
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 579 score: 0.1750
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 580 score: 0.1900
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 581 score: 0.8327
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 582 score: 0.8392
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 583 score: 0.8433
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 584 score: 0.6132
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 585 score: 0.8974
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 586 score: 0.8703
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 587 score: 0.9494
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 588 score: 0.8804
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 589 score: 0.8142
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 590 score: 0.8699
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 591 score: 0.9235
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 592 score: 0.7828
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 593 score: 0.9032
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 594 score: 0.8860
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 595 score: 0.8736
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 596 score: 0.9035
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 597 score: 0.8270
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 598 score: 0.6145
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 599 score: 0.9011
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 600 score: 0.8586
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 601 score: 0.8652
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 602 score: 0.8416
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 603 score: 0.8872
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 604 score: 0.9214
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 605 score: 0.9164
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 606 score: 0.8558
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 607 score: 0.7558
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 608 score: 0.6836
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 609 score: 0.8520
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 610 score: 0.8994
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 611 score: 0.9013
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 612 score: 0.8571
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 613 score: 0.8893
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 614 score: 0.8748
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 615 score: 0.8835
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 616 score: 0.9057
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 617 score: 0.9286
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 618 score: 0.9334
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 619 score: 0.8443
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 620 score: 0.8960
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 621 score: 0.7853
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 622 score: 0.7874
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 623 score: 0.8756
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 624 score: 0.8855
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 625 score: 0.9235
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 626 score: 0.9269
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 627 score: 0.8736
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 628 score: 0.9611
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 629 score: 0.8671
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 630 score: 0.8453
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 631 score: 0.8984
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 632 score: 0.9660
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 633 score: 0.9273
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 634 score: 0.9660
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 635 score: 0.9304
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 636 score: 0.9234
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 637 score: 0.9105
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 638 score: 0.8263
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 639 score: 0.9610
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 640 score: 0.7833
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 641 score: 0.8721
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 642 score: 0.7299
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 643 score: 0.8899
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 644 score: 0.8370
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 645 score: 0.6555
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 646 score: 0.7800
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 647 score: 0.9118
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 648 score: 0.7832
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 649 score: 0.8883
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 650 score: 0.9316
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 651 score: 0.7005
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 652 score: 0.8607
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 653 score: 0.8009
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 654 score: 0.7323
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 655 score: 0.7961
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 656 score: 0.8515
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 657 score: 0.9397
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 658 score: 0.7879
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 659 score: 0.8841
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 660 score: 0.8566
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 661 score: 0.9321
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 662 score: 0.9042
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 663 score: 0.7725
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 664 score: 0.9290
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 665 score: 0.9266
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 666 score: 0.9194
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 667 score: 0.8489
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 668 score: 0.8713
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 669 score: 0.8279
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 670 score: 0.8662
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 671 score: 0.9346
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 672 score: 0.9089
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 673 score: 0.9175
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 674 score: 0.8816
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 675 score: 0.9093
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 676 score: 0.9393
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 677 score: 0.9433
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 678 score: 0.9099
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 679 score: 0.9067
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 680 score: 0.9021
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 681 score: 0.9194
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 682 score: 0.9364
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 683 score: 0.8441
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 684 score: 0.9039
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 685 score: 0.6992
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 686 score: 0.8767
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 687 score: 0.9247
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 688 score: 0.9047
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 689 score: 0.8449
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 690 score: 0.8743
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 691 score: 0.8981
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 692 score: 0.9255
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 693 score: 0.8137
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 694 score: 0.7026
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 695 score: 0.8730
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 696 score: 0.9097
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 697 score: 0.9305
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 698 score: 0.8488
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 699 score: 0.9056
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 700 score: 0.8999
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 701 score: 0.9383
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 702 score: 0.9113
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 703 score: 0.8502
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 704 score: 0.7936
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 705 score: 0.7720
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 706 score: 0.7074
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 707 score: 0.8540
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 708 score: 0.8833
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 709 score: 0.8637
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 710 score: 0.9289
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 711 score: 0.8530
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 712 score: 0.9414
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 713 score: 0.8991
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 714 score: 0.9112
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 715 score: 0.8182
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 716 score: 0.9068
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 717 score: 0.7514
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 718 score: 0.9454
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 719 score: 0.9292
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 720 score: 0.8655
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 721 score: 0.8868
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 722 score: 0.8987
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 723 score: 0.9251
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 724 score: 0.8289
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 725 score: 0.9376
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 726 score: 0.8939
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 727 score: 0.9533
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 728 score: 0.6592
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 729 score: 0.9064
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 730 score: 0.8330
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 731 score: 0.8861
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 732 score: 0.8250
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 733 score: 0.9245
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 734 score: 0.8420
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 735 score: 0.8629
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 736 score: 0.8988
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 737 score: 0.2590
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 738 score: 0.8715
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 739 score: 0.7218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 740 score: 0.8637
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 741 score: 0.8840
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 742 score: 0.8957
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 743 score: 0.8837
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 744 score: 0.8965
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 745 score: 0.8834
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 746 score: 0.9362
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 747 score: 0.9015
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 748 score: 0.9224
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 749 score: 0.9157
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 750 score: 0.9512
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 751 score: 0.9116
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 752 score: 0.8858
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 753 score: 0.9190
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 754 score: 0.9399
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 755 score: 0.8951
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 756 score: 0.8475
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 757 score: 0.8965
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 758 score: 0.8084
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 759 score: 0.9081
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 760 score: 0.9280
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 761 score: 0.8832
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 762 score: 0.9223
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 763 score: 0.8631
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 764 score: 0.8504
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 765 score: 0.8473
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 766 score: 0.9011
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 767 score: 0.7473
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 768 score: 0.9405
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 769 score: 0.8740
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 770 score: 0.9323
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 771 score: 0.8247
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 772 score: 0.7896
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 773 score: 0.9448
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 774 score: 0.8964
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 775 score: 0.8040
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 776 score: 0.8386
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 777 score: 0.8504
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 778 score: 0.8921
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 779 score: 0.6884
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 780 score: 0.8975
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 781 score: 0.7596
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 782 score: 0.8582
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 783 score: 0.7313
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 784 score: 0.9018
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 785 score: 0.7714
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 786 score: 0.9071
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 787 score: 0.9281
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 788 score: 0.9024
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 789 score: 0.8638
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 790 score: 0.8850
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 791 score: 0.8771
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 792 score: 0.9101
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 793 score: 0.8231
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 794 score: 0.8216
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 795 score: 0.8845
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 796 score: 0.9133
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 797 score: 0.8523
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 798 score: 0.8179
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 799 score: 0.8424
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 800 score: 0.8066
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 801 score: 0.8310
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 802 score: 0.9030
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 803 score: 0.8026
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 804 score: 0.7390
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 805 score: 0.8512
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 806 score: 0.8476
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 807 score: 0.8700
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 808 score: 0.9132
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 809 score: 0.8241
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 810 score: 0.8296
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 811 score: 0.8570
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 812 score: 0.9282
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 813 score: 0.9010
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 814 score: 0.9335
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 815 score: 0.7961
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 816 score: 0.9028
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 817 score: 0.8249
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 818 score: 0.6958
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 819 score: 0.6631
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 820 score: 0.8855
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 821 score: 0.8486
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 822 score: 0.8441
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 823 score: 0.8513
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 824 score: 0.8872
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 825 score: 0.8372
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 826 score: 0.8300
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 827 score: 0.7163
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 828 score: 0.8078
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 829 score: 0.8530
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 830 score: 0.7910
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 831 score: 0.8353
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 832 score: 0.7528
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 833 score: 0.6196
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 834 score: 0.8267
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 835 score: 0.7963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 836 score: 0.8224
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 837 score: 0.9085
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 838 score: 0.8977
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 839 score: 0.7721
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 840 score: 0.8764
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 841 score: 0.8456
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 842 score: 0.7983
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 843 score: 0.8425
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 844 score: 0.7976
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 845 score: 0.6468
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 846 score: 0.2276
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 847 score: 0.9040
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 848 score: 0.7195
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 849 score: 0.8479
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 850 score: 0.8639
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 851 score: 0.9291
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 852 score: 0.8526
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 853 score: 0.8422
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 854 score: 0.8617
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 855 score: 0.8972
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 856 score: 0.7360
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 857 score: 0.9248
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 858 score: 0.9331
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 859 score: 0.9386
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 860 score: 0.9020
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 861 score: 0.8421
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 862 score: 0.8945
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 863 score: 0.8817
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 864 score: 0.8040
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 865 score: 0.7106
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 866 score: 0.9044
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 867 score: 0.8660
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 868 score: 0.9081
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 869 score: 0.8712
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 870 score: 0.9587
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 871 score: 0.8960
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 872 score: 0.9134
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 873 score: 0.9117
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 874 score: 0.9432
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 875 score: 0.8533
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 876 score: 0.7338
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 877 score: 0.8973
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 878 score: 0.9445
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 879 score: 0.8381
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 880 score: 0.9185
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 881 score: 0.9353
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 882 score: 0.9283
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 883 score: 0.8772
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 884 score: 0.8427
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 885 score: 0.7996
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 886 score: 0.8544
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 887 score: 0.8071
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 888 score: 0.6887
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 889 score: 0.8760
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 890 score: 0.8564
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 891 score: 0.8751
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 892 score: 0.8066
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 893 score: 0.7153
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 894 score: 0.8809
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 895 score: 0.8996
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 896 score: 0.8985
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 897 score: 0.8799
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 898 score: 0.9376
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 899 score: 0.7896
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 900 score: 0.8538
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 901 score: 0.9166
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 902 score: 0.7185
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 903 score: 0.8963
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 904 score: 0.9012
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 905 score: 0.6891
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 906 score: 0.9379
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 907 score: 0.7697
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 908 score: 0.8849
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 909 score: 0.9044
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 910 score: 0.9039
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 911 score: 0.8875
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 912 score: 0.9177
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 913 score: 0.7898
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 914 score: 0.8153
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 915 score: 0.8691
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 916 score: 0.7484
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 917 score: 0.8242
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 918 score: 0.7957
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 919 score: 0.7920
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 920 score: 0.8707
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 921 score: 0.8458
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 922 score: 0.8569
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 923 score: 0.8909
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 924 score: 0.8986
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 925 score: 0.8756
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 926 score: 0.9415
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 927 score: 0.8358
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 928 score: 0.8119
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 929 score: 0.8280
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 930 score: 0.8916
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 931 score: 0.8774
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 932 score: 0.7668
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 933 score: 0.8735
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 934 score: 0.8218
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 935 score: 0.8760
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 936 score: 0.7190
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 937 score: 0.9672
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 938 score: 0.9586
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 939 score: 0.9158
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 940 score: 0.8756
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 941 score: 0.9925
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 942 score: 0.9515
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 943 score: 0.9172
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 944 score: 0.8957
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 945 score: 0.9098
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 946 score: 0.9137
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 947 score: 0.8752
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 948 score: 0.8427
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 949 score: 0.8923
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 950 score: 0.8756
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 951 score: 0.8457
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 952 score: 0.8297
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 953 score: 0.8661
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 954 score: 0.8166
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 955 score: 0.8733
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 956 score: 0.9190
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 957 score: 0.9394
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 958 score: 0.9226
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 959 score: 0.7684
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 960 score: 0.8178
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 961 score: 0.6713
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 962 score: 0.8569
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 963 score: 0.8444
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 964 score: 0.9316
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 965 score: 0.8124
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 966 score: 0.8617
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 967 score: 0.7917
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 968 score: 0.8311
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 969 score: 0.7999
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 970 score: 0.8576
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 971 score: 0.8195
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 972 score: 0.8876
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 973 score: 0.9227
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 974 score: 0.8008
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 975 score: 0.8895
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 976 score: 0.8611
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 977 score: 0.8468
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 978 score: 0.8899
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 979 score: 0.8577
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 980 score: 0.8673
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 981 score: 0.8344
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 982 score: 0.8102
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 983 score: 0.7629
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 984 score: 0.8950
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 985 score: 0.9002
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 986 score: 0.9432
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 987 score: 0.8404
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 988 score: 0.6909
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 989 score: 0.8546
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 990 score: 0.9456
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 991 score: 0.8609
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 992 score: 0.8692
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 993 score: 0.8338
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 994 score: 0.7961
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 995 score: 0.8360
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 996 score: 0.7947
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 997 score: 0.9397
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 998 score: 0.8810
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 999 score: 0.8926
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1000 score: 0.8935
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1001 score: 0.8438
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1002 score: 0.9083
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1003 score: 0.8474
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1004 score: 0.9307
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1005 score: 0.9272
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1006 score: 0.9388
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1007 score: 0.9331
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1008 score: 0.9614
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1009 score: 0.8383
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1010 score: 0.8957
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms Segment 1011 score: 0.8835
/beacon-scratch/tongzh24/ALMA-checkpoint/exp_16_languages/alma-13b-sft-16-languages-ms-max-tokens-512//test-en-ms score: 0.8564