TongZheng1999's picture
Upload folder using huggingface_hub
e2edaeb verified
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 0 score: 0.8553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1 score: 0.9268
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 2 score: 0.9173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 3 score: 0.8473
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 4 score: 0.9123
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 5 score: 0.6846
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 6 score: 0.8345
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 7 score: 0.8649
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 8 score: 0.8047
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 9 score: 0.8582
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 10 score: 0.9547
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 11 score: 0.8166
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 12 score: 0.9037
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 13 score: 0.8165
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 14 score: 0.8886
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 15 score: 0.8194
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 16 score: 0.8631
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 17 score: 0.9456
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 18 score: 0.9397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 19 score: 0.8736
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 20 score: 0.9429
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 21 score: 0.8792
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 22 score: 0.7805
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 23 score: 0.9093
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 24 score: 0.9297
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 25 score: 0.9592
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 26 score: 0.8836
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 27 score: 0.8563
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 28 score: 0.8907
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 29 score: 0.9377
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 30 score: 0.7837
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 31 score: 0.8755
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 32 score: 0.8661
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 33 score: 0.9333
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 34 score: 0.9437
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 35 score: 0.9378
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 36 score: 0.9163
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 37 score: 0.8374
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 38 score: 0.9080
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 39 score: 0.9102
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 40 score: 0.8683
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 41 score: 0.9552
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 42 score: 0.8747
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 43 score: 0.9089
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 44 score: 0.8817
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 45 score: 0.9209
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 46 score: 0.9444
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 47 score: 0.8784
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 48 score: 0.9450
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 49 score: 0.9286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 50 score: 0.9363
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 51 score: 0.9279
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 52 score: 0.9427
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 53 score: 0.9404
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 54 score: 0.9358
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 55 score: 0.9176
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 56 score: 0.9097
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 57 score: 0.8845
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 58 score: 0.8648
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 59 score: 0.9629
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 60 score: 0.9457
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 61 score: 0.9556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 62 score: 0.8143
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 63 score: 0.9386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 64 score: 0.8788
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 65 score: 0.8055
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 66 score: 0.7726
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 67 score: 0.6469
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 68 score: 0.9531
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 69 score: 0.9149
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 70 score: 0.8979
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 71 score: 0.9032
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 72 score: 0.8761
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 73 score: 0.8800
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 74 score: 0.9063
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 75 score: 0.8969
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 76 score: 0.8681
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 77 score: 0.9337
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 78 score: 0.8812
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 79 score: 0.9536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 80 score: 0.8966
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 81 score: 0.9690
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 82 score: 0.9062
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 83 score: 0.8595
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 84 score: 0.9369
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 85 score: 0.9167
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 86 score: 0.8926
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 87 score: 0.9053
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 88 score: 0.9434
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 89 score: 0.9011
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 90 score: 0.9180
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 91 score: 0.8948
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 92 score: 0.8580
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 93 score: 0.8806
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 94 score: 0.9415
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 95 score: 0.9228
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 96 score: 0.8080
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 97 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 98 score: 0.9485
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 99 score: 0.9201
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 100 score: 0.9376
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 101 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 102 score: 0.9268
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 103 score: 0.9903
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 104 score: 0.9106
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 105 score: 0.8232
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 106 score: 0.9519
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 107 score: 0.9111
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 108 score: 0.8864
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 109 score: 0.7958
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 110 score: 0.9021
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 111 score: 0.9672
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 112 score: 0.9461
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 113 score: 0.9446
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 114 score: 0.9119
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 115 score: 0.9259
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 116 score: 0.9378
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 117 score: 0.9450
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 118 score: 0.8587
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 119 score: 0.8539
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 120 score: 0.8312
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 121 score: 0.9155
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 122 score: 0.9414
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 123 score: 0.9665
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 124 score: 0.8716
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 125 score: 0.9321
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 126 score: 0.9451
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 127 score: 0.9219
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 128 score: 0.9283
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 129 score: 0.9054
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 130 score: 0.9420
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 131 score: 0.8991
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 132 score: 0.9301
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 133 score: 0.8710
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 134 score: 0.8652
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 135 score: 0.7287
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 136 score: 0.8934
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 137 score: 0.7982
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 138 score: 0.9070
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 139 score: 0.9273
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 140 score: 0.9076
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 141 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 142 score: 0.9414
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 143 score: 0.9191
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 144 score: 0.8044
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 145 score: 0.9367
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 146 score: 0.9406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 147 score: 0.9136
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 148 score: 0.9131
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 149 score: 0.8937
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 150 score: 0.9462
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 151 score: 0.8996
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 152 score: 0.8839
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 153 score: 0.7675
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 154 score: 0.8198
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 155 score: 0.9188
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 156 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 157 score: 0.8552
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 158 score: 0.9224
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 159 score: 0.9094
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 160 score: 0.9208
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 161 score: 0.8441
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 162 score: 0.8890
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 163 score: 0.9066
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 164 score: 0.9310
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 165 score: 0.8578
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 166 score: 0.9194
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 167 score: 0.8997
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 168 score: 0.8988
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 169 score: 0.8299
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 170 score: 0.8643
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 171 score: 0.8629
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 172 score: 0.7928
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 173 score: 0.9396
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 174 score: 0.8825
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 175 score: 0.9333
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 176 score: 0.7916
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 177 score: 0.8908
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 178 score: 0.9259
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 179 score: 0.9262
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 180 score: 0.9228
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 181 score: 0.9419
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 182 score: 0.8901
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 183 score: 0.9366
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 184 score: 0.8766
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 185 score: 0.9614
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 186 score: 0.9237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 187 score: 0.9436
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 188 score: 0.8971
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 189 score: 0.9268
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 190 score: 0.9060
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 191 score: 0.9380
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 192 score: 0.8592
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 193 score: 0.8343
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 194 score: 0.8937
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 195 score: 0.9192
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 196 score: 0.9408
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 197 score: 0.8439
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 198 score: 0.9073
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 199 score: 0.8638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 200 score: 0.8230
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 201 score: 0.8562
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 202 score: 0.8076
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 203 score: 0.8412
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 204 score: 0.9040
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 205 score: 0.9348
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 206 score: 0.9275
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 207 score: 0.9131
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 208 score: 0.9402
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 209 score: 0.8950
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 210 score: 0.9537
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 211 score: 0.9332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 212 score: 0.9585
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 213 score: 0.8302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 214 score: 0.9151
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 215 score: 0.8776
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 216 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 217 score: 0.9385
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 218 score: 0.9572
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 219 score: 0.9329
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 220 score: 0.9490
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 221 score: 0.9225
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 222 score: 0.9105
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 223 score: 0.9229
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 224 score: 0.9035
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 225 score: 0.9391
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 226 score: 0.9468
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 227 score: 0.8171
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 228 score: 0.8197
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 229 score: 0.7976
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 230 score: 0.9575
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 231 score: 0.8758
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 232 score: 0.8518
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 233 score: 0.8868
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 234 score: 0.8234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 235 score: 0.7602
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 236 score: 0.8035
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 237 score: 0.9059
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 238 score: 0.9395
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 239 score: 0.8577
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 240 score: 0.7420
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 241 score: 0.6356
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 242 score: 0.9394
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 243 score: 0.7882
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 244 score: 0.8840
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 245 score: 0.9367
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 246 score: 0.8133
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 247 score: 0.8351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 248 score: 0.8628
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 249 score: 0.9447
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 250 score: 0.9143
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 251 score: 0.9532
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 252 score: 0.9426
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 253 score: 0.9612
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 254 score: 0.9731
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 255 score: 0.9541
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 256 score: 0.8390
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 257 score: 0.9276
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 258 score: 0.9237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 259 score: 0.9057
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 260 score: 0.8881
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 261 score: 0.7389
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 262 score: 0.8752
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 263 score: 0.9110
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 264 score: 0.9316
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 265 score: 0.9108
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 266 score: 0.8906
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 267 score: 0.8790
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 268 score: 0.8593
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 269 score: 0.9307
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 270 score: 0.9153
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 271 score: 0.8245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 272 score: 0.9414
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 273 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 274 score: 0.8655
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 275 score: 0.8012
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 276 score: 0.8976
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 277 score: 0.9428
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 278 score: 0.9243
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 279 score: 0.8813
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 280 score: 0.9329
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 281 score: 0.9365
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 282 score: 0.9587
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 283 score: 0.9086
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 284 score: 0.9453
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 285 score: 0.9575
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 286 score: 0.8565
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 287 score: 0.8681
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 288 score: 0.9371
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 289 score: 0.9026
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 290 score: 0.8674
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 291 score: 0.8117
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 292 score: 0.8733
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 293 score: 0.9214
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 294 score: 0.9111
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 295 score: 0.7883
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 296 score: 0.8360
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 297 score: 0.8895
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 298 score: 0.7100
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 299 score: 0.9216
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 300 score: 0.9371
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 301 score: 0.8448
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 302 score: 0.9040
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 303 score: 0.9438
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 304 score: 0.9185
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 305 score: 0.9374
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 306 score: 0.8884
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 307 score: 0.8369
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 308 score: 0.9293
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 309 score: 0.9031
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 310 score: 0.9486
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 311 score: 0.9521
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 312 score: 0.9513
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 313 score: 0.8824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 314 score: 0.9474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 315 score: 0.9554
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 316 score: 0.9434
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 317 score: 0.8745
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 318 score: 0.8270
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 319 score: 0.8247
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 320 score: 0.8663
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 321 score: 0.7771
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 322 score: 0.9207
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 323 score: 0.9194
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 324 score: 0.9465
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 325 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 326 score: 0.8401
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 327 score: 0.9294
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 328 score: 0.9320
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 329 score: 0.8954
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 330 score: 0.9198
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 331 score: 0.9453
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 332 score: 0.9053
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 333 score: 0.8676
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 334 score: 0.9691
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 335 score: 0.9156
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 336 score: 0.8637
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 337 score: 0.7962
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 338 score: 0.9424
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 339 score: 0.9206
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 340 score: 0.8682
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 341 score: 0.9239
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 342 score: 0.7496
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 343 score: 0.8835
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 344 score: 0.9057
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 345 score: 0.8930
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 346 score: 0.9532
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 347 score: 0.9346
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 348 score: 0.9297
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 349 score: 0.8261
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 350 score: 0.9325
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 351 score: 0.8735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 352 score: 0.9113
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 353 score: 0.8789
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 354 score: 0.8700
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 355 score: 0.9152
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 356 score: 0.9062
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 357 score: 0.9137
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 358 score: 0.8166
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 359 score: 0.8478
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 360 score: 0.8458
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 361 score: 0.8817
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 362 score: 0.9550
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 363 score: 0.7710
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 364 score: 0.9287
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 365 score: 0.8252
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 366 score: 0.8237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 367 score: 0.9013
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 368 score: 0.8395
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 369 score: 0.9112
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 370 score: 0.8393
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 371 score: 0.7705
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 372 score: 0.8943
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 373 score: 0.8768
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 374 score: 0.9398
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 375 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 376 score: 0.9438
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 377 score: 0.9411
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 378 score: 0.8037
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 379 score: 0.9317
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 380 score: 0.9292
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 381 score: 0.9455
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 382 score: 0.7749
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 383 score: 0.8774
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 384 score: 0.8101
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 385 score: 0.8485
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 386 score: 0.7986
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 387 score: 0.9269
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 388 score: 0.9263
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 389 score: 0.8034
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 390 score: 0.9327
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 391 score: 0.9101
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 392 score: 0.9204
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 393 score: 0.9101
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 394 score: 0.9417
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 395 score: 0.9621
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 396 score: 0.8961
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 397 score: 0.9343
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 398 score: 0.8682
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 399 score: 0.9513
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 400 score: 0.9595
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 401 score: 0.8932
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 402 score: 0.9011
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 403 score: 0.8769
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 404 score: 0.8640
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 405 score: 0.8546
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 406 score: 0.8924
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 407 score: 0.9203
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 408 score: 0.9340
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 409 score: 0.9000
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 410 score: 0.9178
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 411 score: 0.8726
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 412 score: 0.8891
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 413 score: 0.9601
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 414 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 415 score: 0.9340
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 416 score: 0.8608
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 417 score: 0.8210
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 418 score: 0.9474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 419 score: 0.9231
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 420 score: 0.9705
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 421 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 422 score: 0.9319
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 423 score: 0.8551
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 424 score: 0.9130
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 425 score: 0.9447
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 426 score: 0.9159
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 427 score: 0.8929
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 428 score: 0.9224
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 429 score: 0.9277
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 430 score: 0.8906
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 431 score: 0.8796
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 432 score: 0.8814
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 433 score: 0.8465
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 434 score: 0.8456
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 435 score: 0.7763
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 436 score: 0.8873
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 437 score: 0.8595
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 438 score: 0.9530
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 439 score: 0.9537
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 440 score: 0.9356
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 441 score: 0.9186
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 442 score: 0.9393
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 443 score: 0.9056
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 444 score: 0.8869
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 445 score: 0.8855
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 446 score: 0.9313
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 447 score: 0.9426
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 448 score: 0.9526
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 449 score: 0.8636
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 450 score: 0.9216
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 451 score: 0.9415
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 452 score: 0.9591
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 453 score: 0.8859
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 454 score: 0.9267
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 455 score: 0.8476
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 456 score: 0.8511
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 457 score: 0.9566
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 458 score: 0.9286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 459 score: 0.8892
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 460 score: 0.9121
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 461 score: 0.8693
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 462 score: 0.9254
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 463 score: 0.9522
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 464 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 465 score: 0.9078
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 466 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 467 score: 0.7468
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 468 score: 0.7321
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 469 score: 0.7425
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 470 score: 0.8177
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 471 score: 0.8768
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 472 score: 0.8542
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 473 score: 0.8567
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 474 score: 0.8278
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 475 score: 0.9240
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 476 score: 0.8973
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 477 score: 0.9120
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 478 score: 0.8786
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 479 score: 0.9012
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 480 score: 0.8928
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 481 score: 0.9136
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 482 score: 0.9162
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 483 score: 0.8769
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 484 score: 0.9016
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 485 score: 0.9267
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 486 score: 0.9134
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 487 score: 0.9060
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 488 score: 0.9187
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 489 score: 0.9408
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 490 score: 0.9004
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 491 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 492 score: 0.9022
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 493 score: 0.9531
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 494 score: 0.8897
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 495 score: 0.9136
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 496 score: 0.9077
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 497 score: 0.8872
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 498 score: 0.9290
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 499 score: 0.9373
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 500 score: 0.9591
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 501 score: 0.9457
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 502 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 503 score: 0.8952
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 504 score: 0.8408
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 505 score: 0.9250
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 506 score: 0.8857
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 507 score: 0.8543
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 508 score: 0.8090
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 509 score: 0.8158
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 510 score: 0.8085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 511 score: 0.8512
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 512 score: 0.8302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 513 score: 0.8909
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 514 score: 0.9537
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 515 score: 0.9449
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 516 score: 0.7666
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 517 score: 0.9160
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 518 score: 0.9222
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 519 score: 0.9635
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 520 score: 0.8943
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 521 score: 0.9467
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 522 score: 0.9215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 523 score: 0.9033
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 524 score: 0.9220
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 525 score: 0.9380
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 526 score: 0.8370
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 527 score: 0.7615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 528 score: 0.8279
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 529 score: 0.9171
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 530 score: 0.8152
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 531 score: 0.8675
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 532 score: 0.9209
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 533 score: 0.9073
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 534 score: 0.8533
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 535 score: 0.8333
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 536 score: 0.8576
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 537 score: 0.9131
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 538 score: 0.9332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 539 score: 0.9183
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 540 score: 0.9085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 541 score: 0.9442
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 542 score: 0.8964
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 543 score: 0.9004
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 544 score: 0.9016
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 545 score: 0.9735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 546 score: 0.7824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 547 score: 0.8213
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 548 score: 0.8792
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 549 score: 0.9363
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 550 score: 0.8786
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 551 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 552 score: 0.9470
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 553 score: 0.9154
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 554 score: 0.9100
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 555 score: 0.8967
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 556 score: 0.8861
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 557 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 558 score: 0.8215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 559 score: 0.8494
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 560 score: 0.7834
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 561 score: 0.9214
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 562 score: 0.8399
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 563 score: 0.5098
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 564 score: 0.8348
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 565 score: 0.9346
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 566 score: 0.9110
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 567 score: 0.9237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 568 score: 0.8759
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 569 score: 0.8098
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 570 score: 0.9198
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 571 score: 0.8715
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 572 score: 0.8724
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 573 score: 0.9252
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 574 score: 0.9589
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 575 score: 0.8386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 576 score: 0.5785
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 577 score: 0.9127
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 578 score: 0.9189
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 579 score: 0.9334
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 580 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 581 score: 0.9135
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 582 score: 0.9305
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 583 score: 0.8853
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 584 score: 0.7536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 585 score: 0.9398
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 586 score: 0.8937
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 587 score: 0.9532
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 588 score: 0.9195
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 589 score: 0.9534
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 590 score: 0.8477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 591 score: 0.9215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 592 score: 0.8648
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 593 score: 0.9174
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 594 score: 0.9568
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 595 score: 0.9473
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 596 score: 0.8987
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 597 score: 0.9055
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 598 score: 0.8638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 599 score: 0.9545
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 600 score: 0.9185
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 601 score: 0.8774
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 602 score: 0.9120
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 603 score: 0.8978
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 604 score: 0.9440
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 605 score: 0.9123
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 606 score: 0.9394
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 607 score: 0.8350
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 608 score: 0.8934
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 609 score: 0.9054
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 610 score: 0.9446
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 611 score: 0.9214
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 612 score: 0.9074
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 613 score: 0.8961
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 614 score: 0.9500
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 615 score: 0.8635
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 616 score: 0.9307
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 617 score: 0.9237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 618 score: 0.9074
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 619 score: 0.8883
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 620 score: 0.8839
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 621 score: 0.8050
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 622 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 623 score: 0.9427
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 624 score: 0.9244
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 625 score: 0.9471
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 626 score: 0.9314
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 627 score: 0.9413
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 628 score: 0.9479
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 629 score: 0.9376
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 630 score: 0.9585
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 631 score: 0.9467
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 632 score: 0.9098
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 633 score: 0.9407
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 634 score: 0.9828
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 635 score: 0.9558
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 636 score: 0.9418
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 637 score: 0.8924
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 638 score: 0.9119
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 639 score: 0.9514
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 640 score: 0.9307
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 641 score: 0.9506
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 642 score: 0.8824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 643 score: 0.7228
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 644 score: 0.8808
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 645 score: 0.8873
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 646 score: 0.9446
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 647 score: 0.8920
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 648 score: 0.8476
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 649 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 650 score: 0.9561
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 651 score: 0.9175
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 652 score: 0.5329
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 653 score: 0.6986
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 654 score: 0.9198
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 655 score: 0.9031
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 656 score: 0.8494
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 657 score: 0.8210
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 658 score: 0.8478
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 659 score: 0.9054
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 660 score: 0.8421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 661 score: 0.9295
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 662 score: 0.9495
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 663 score: 0.9085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 664 score: 0.9511
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 665 score: 0.8702
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 666 score: 0.9160
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 667 score: 0.7587
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 668 score: 0.9457
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 669 score: 0.9298
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 670 score: 0.9104
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 671 score: 0.9254
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 672 score: 0.9202
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 673 score: 0.9360
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 674 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 675 score: 0.9396
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 676 score: 0.8899
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 677 score: 0.9213
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 678 score: 0.9457
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 679 score: 0.9332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 680 score: 0.9185
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 681 score: 0.9497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 682 score: 0.8951
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 683 score: 0.8881
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 684 score: 0.9246
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 685 score: 0.8775
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 686 score: 0.8647
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 687 score: 0.9009
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 688 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 689 score: 0.9125
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 690 score: 0.9157
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 691 score: 0.9015
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 692 score: 0.8973
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 693 score: 0.8886
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 694 score: 0.8522
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 695 score: 0.9494
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 696 score: 0.9229
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 697 score: 0.9287
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 698 score: 0.8497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 699 score: 0.9067
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 700 score: 0.8435
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 701 score: 0.9495
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 702 score: 0.9706
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 703 score: 0.7918
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 704 score: 0.8742
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 705 score: 0.8919
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 706 score: 0.8556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 707 score: 0.9028
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 708 score: 0.9075
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 709 score: 0.8833
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 710 score: 0.9342
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 711 score: 0.9059
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 712 score: 0.9435
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 713 score: 0.9391
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 714 score: 0.9110
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 715 score: 0.8759
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 716 score: 0.9130
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 717 score: 0.9370
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 718 score: 0.9287
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 719 score: 0.9274
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 720 score: 0.9079
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 721 score: 0.9151
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 722 score: 0.9285
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 723 score: 0.9310
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 724 score: 0.8715
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 725 score: 0.9161
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 726 score: 0.8932
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 727 score: 0.9273
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 728 score: 0.8331
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 729 score: 0.8617
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 730 score: 0.8773
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 731 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 732 score: 0.8737
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 733 score: 0.9520
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 734 score: 0.9194
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 735 score: 0.9337
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 736 score: 0.9176
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 737 score: 0.9060
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 738 score: 0.9229
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 739 score: 0.8948
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 740 score: 0.8445
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 741 score: 0.8824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 742 score: 0.8659
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 743 score: 0.9432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 744 score: 0.9540
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 745 score: 0.9311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 746 score: 0.9474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 747 score: 0.9193
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 748 score: 0.9706
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 749 score: 0.9508
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 750 score: 0.9608
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 751 score: 0.8665
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 752 score: 0.9257
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 753 score: 0.9032
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 754 score: 0.8682
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 755 score: 0.9154
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 756 score: 0.8821
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 757 score: 0.9104
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 758 score: 0.8766
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 759 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 760 score: 0.9343
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 761 score: 0.9252
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 762 score: 0.9569
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 763 score: 0.9173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 764 score: 0.9237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 765 score: 0.8704
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 766 score: 0.9203
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 767 score: 0.9009
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 768 score: 0.9545
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 769 score: 0.9578
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 770 score: 0.9231
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 771 score: 0.9226
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 772 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 773 score: 0.9452
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 774 score: 0.8978
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 775 score: 0.8808
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 776 score: 0.8916
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 777 score: 0.9319
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 778 score: 0.8575
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 779 score: 0.8412
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 780 score: 0.8606
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 781 score: 0.7972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 782 score: 0.9310
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 783 score: 0.8327
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 784 score: 0.9376
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 785 score: 0.8204
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 786 score: 0.8804
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 787 score: 0.9210
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 788 score: 0.9272
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 789 score: 0.9215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 790 score: 0.9385
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 791 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 792 score: 0.9059
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 793 score: 0.8881
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 794 score: 0.9201
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 795 score: 0.8833
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 796 score: 0.9591
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 797 score: 0.8819
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 798 score: 0.9311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 799 score: 0.8732
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 800 score: 0.9154
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 801 score: 0.8780
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 802 score: 0.9280
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 803 score: 0.8220
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 804 score: 0.9075
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 805 score: 0.9326
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 806 score: 0.9508
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 807 score: 0.8884
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 808 score: 0.9150
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 809 score: 0.8821
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 810 score: 0.9564
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 811 score: 0.8680
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 812 score: 0.9531
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 813 score: 0.9520
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 814 score: 0.9178
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 815 score: 0.8804
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 816 score: 0.9089
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 817 score: 0.7499
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 818 score: 0.8389
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 819 score: 0.9010
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 820 score: 0.8912
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 821 score: 0.9587
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 822 score: 0.9014
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 823 score: 0.9079
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 824 score: 0.9046
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 825 score: 0.9471
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 826 score: 0.9266
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 827 score: 0.9425
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 828 score: 0.8881
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 829 score: 0.9072
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 830 score: 0.9096
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 831 score: 0.8527
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 832 score: 0.9462
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 833 score: 0.7423
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 834 score: 0.9143
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 835 score: 0.8518
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 836 score: 0.9220
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 837 score: 0.8740
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 838 score: 0.8682
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 839 score: 0.8823
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 840 score: 0.9244
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 841 score: 0.8132
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 842 score: 0.6488
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 843 score: 0.8886
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 844 score: 0.7729
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 845 score: 0.8702
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 846 score: 0.7840
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 847 score: 0.8650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 848 score: 0.7315
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 849 score: 0.8694
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 850 score: 0.9033
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 851 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 852 score: 0.8885
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 853 score: 0.8679
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 854 score: 0.8079
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 855 score: 0.8397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 856 score: 0.7086
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 857 score: 0.9386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 858 score: 0.9299
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 859 score: 0.9355
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 860 score: 0.9115
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 861 score: 0.9389
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 862 score: 0.9150
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 863 score: 0.8528
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 864 score: 0.7558
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 865 score: 0.8000
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 866 score: 0.9008
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 867 score: 0.9245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 868 score: 0.8955
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 869 score: 0.9279
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 870 score: 0.9422
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 871 score: 0.9480
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 872 score: 0.9348
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 873 score: 0.9168
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 874 score: 0.9399
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 875 score: 0.8776
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 876 score: 0.8262
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 877 score: 0.8955
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 878 score: 0.9677
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 879 score: 0.9354
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 880 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 881 score: 0.9411
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 882 score: 0.8884
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 883 score: 0.9362
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 884 score: 0.8684
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 885 score: 0.8807
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 886 score: 0.9148
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 887 score: 0.8658
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 888 score: 0.8085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 889 score: 0.8492
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 890 score: 0.9191
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 891 score: 0.8922
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 892 score: 0.8633
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 893 score: 0.7958
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 894 score: 0.9294
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 895 score: 0.9383
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 896 score: 0.9472
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 897 score: 0.9224
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 898 score: 0.8402
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 899 score: 0.8377
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 900 score: 0.8534
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 901 score: 0.9165
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 902 score: 0.8722
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 903 score: 0.9289
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 904 score: 0.9334
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 905 score: 0.8094
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 906 score: 0.9300
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 907 score: 0.8829
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 908 score: 0.8657
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 909 score: 0.9570
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 910 score: 0.8707
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 911 score: 0.8426
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 912 score: 0.9321
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 913 score: 0.8888
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 914 score: 0.8338
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 915 score: 0.9109
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 916 score: 0.9419
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 917 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 918 score: 0.9549
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 919 score: 0.8956
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 920 score: 0.7242
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 921 score: 0.9007
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 922 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 923 score: 0.8821
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 924 score: 0.9269
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 925 score: 0.9191
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 926 score: 0.9518
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 927 score: 0.9100
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 928 score: 0.9253
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 929 score: 0.8601
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 930 score: 0.8777
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 931 score: 0.7736
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 932 score: 0.7827
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 933 score: 0.9008
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 934 score: 0.8313
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 935 score: 0.8637
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 936 score: 0.9129
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 937 score: 0.9653
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 938 score: 0.9561
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 939 score: 0.9307
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 940 score: 0.9607
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 941 score: 0.9763
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 942 score: 0.9572
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 943 score: 0.8762
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 944 score: 0.8650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 945 score: 0.9434
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 946 score: 0.9078
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 947 score: 0.7829
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 948 score: 0.8762
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 949 score: 0.9101
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 950 score: 0.8678
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 951 score: 0.9404
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 952 score: 0.9050
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 953 score: 0.9125
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 954 score: 0.8829
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 955 score: 0.9274
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 956 score: 0.9395
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 957 score: 0.9477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 958 score: 0.9082
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 959 score: 0.8567
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 960 score: 0.7555
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 961 score: 0.9193
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 962 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 963 score: 0.9392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 964 score: 0.9423
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 965 score: 0.8839
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 966 score: 0.9000
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 967 score: 0.8863
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 968 score: 0.9187
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 969 score: 0.7883
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 970 score: 0.9028
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 971 score: 0.8854
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 972 score: 0.8764
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 973 score: 0.9052
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 974 score: 0.9133
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 975 score: 0.9393
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 976 score: 0.8191
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 977 score: 0.8578
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 978 score: 0.9331
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 979 score: 0.9127
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 980 score: 0.9134
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 981 score: 0.8946
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 982 score: 0.7415
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 983 score: 0.7825
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 984 score: 0.9531
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 985 score: 0.8998
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 986 score: 0.8336
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 987 score: 0.9099
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 988 score: 0.8551
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 989 score: 0.7868
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 990 score: 0.8985
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 991 score: 0.8410
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 992 score: 0.9180
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 993 score: 0.8892
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 994 score: 0.8386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 995 score: 0.9070
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 996 score: 0.9194
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 997 score: 0.9601
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 998 score: 0.9389
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 999 score: 0.8448
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1000 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1001 score: 0.8446
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1002 score: 0.9179
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1003 score: 0.8897
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1004 score: 0.7626
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1005 score: 0.9159
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1006 score: 0.8460
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1007 score: 0.9522
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1008 score: 0.9530
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1009 score: 0.9168
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1010 score: 0.8886
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk Segment 1011 score: 0.9002
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-mk-max-tokens-512/test-en-mk score: 0.8944