TongZheng1999's picture
Upload folder using huggingface_hub
fa15376 verified
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 0 score: 0.8049
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1 score: 0.9309
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 2 score: 0.9368
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 3 score: 0.9058
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 4 score: 0.9388
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 5 score: 0.8002
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 6 score: 0.9256
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 7 score: 0.8988
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 8 score: 0.8368
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 9 score: 0.8473
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 10 score: 0.9486
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 11 score: 0.8013
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 12 score: 0.9056
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 13 score: 0.9370
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 14 score: 0.9023
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 15 score: 0.7901
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 16 score: 0.9012
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 17 score: 0.9553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 18 score: 0.9384
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 19 score: 0.9061
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 20 score: 0.9471
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 21 score: 0.9519
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 22 score: 0.7839
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 23 score: 0.9356
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 24 score: 0.9416
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 25 score: 0.9388
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 26 score: 0.8931
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 27 score: 0.9012
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 28 score: 0.7095
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 29 score: 0.9218
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 30 score: 0.7244
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 31 score: 0.8938
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 32 score: 0.7995
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 33 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 34 score: 0.9583
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 35 score: 0.9453
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 36 score: 0.9272
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 37 score: 0.8423
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 38 score: 0.8859
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 39 score: 0.8938
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 40 score: 0.8910
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 41 score: 0.9197
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 42 score: 0.9378
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 43 score: 0.9470
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 44 score: 0.8477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 45 score: 0.9086
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 46 score: 0.9206
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 47 score: 0.8553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 48 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 49 score: 0.9510
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 50 score: 0.9630
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 51 score: 0.9203
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 52 score: 0.9602
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 53 score: 0.9668
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 54 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 55 score: 0.9530
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 56 score: 0.9329
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 57 score: 0.8900
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 58 score: 0.8173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 59 score: 0.9697
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 60 score: 0.9241
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 61 score: 0.9610
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 62 score: 0.8236
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 63 score: 0.9416
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 64 score: 0.9327
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 65 score: 0.6923
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 66 score: 0.7176
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 67 score: 0.6809
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 68 score: 0.9589
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 69 score: 0.8931
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 70 score: 0.9022
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 71 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 72 score: 0.8978
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 73 score: 0.9173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 74 score: 0.8710
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 75 score: 0.8706
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 76 score: 0.9262
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 77 score: 0.9650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 78 score: 0.9599
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 79 score: 0.8984
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 80 score: 0.8908
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 81 score: 0.9517
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 82 score: 0.9049
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 83 score: 0.8265
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 84 score: 0.9432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 85 score: 0.9529
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 86 score: 0.8650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 87 score: 0.8821
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 88 score: 0.9382
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 89 score: 0.9174
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 90 score: 0.8854
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 91 score: 0.9259
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 92 score: 0.8704
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 93 score: 0.8753
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 94 score: 0.9519
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 95 score: 0.9599
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 96 score: 0.8286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 97 score: 0.9351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 98 score: 0.9113
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 99 score: 0.8825
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 100 score: 0.9489
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 101 score: 0.9557
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 102 score: 0.9368
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 103 score: 0.9764
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 104 score: 0.9646
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 105 score: 0.8874
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 106 score: 0.9508
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 107 score: 0.9234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 108 score: 0.8932
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 109 score: 0.7270
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 110 score: 0.9092
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 111 score: 0.9641
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 112 score: 0.9703
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 113 score: 0.9742
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 114 score: 0.9181
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 115 score: 0.9460
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 116 score: 0.9234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 117 score: 0.9580
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 118 score: 0.9728
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 119 score: 0.9157
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 120 score: 0.8410
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 121 score: 0.9245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 122 score: 0.9391
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 123 score: 0.9578
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 124 score: 0.9238
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 125 score: 0.9508
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 126 score: 0.8829
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 127 score: 0.8920
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 128 score: 0.9548
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 129 score: 0.9434
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 130 score: 0.9282
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 131 score: 0.9397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 132 score: 0.9501
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 133 score: 0.9553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 134 score: 0.8397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 135 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 136 score: 0.9270
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 137 score: 0.9378
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 138 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 139 score: 0.9244
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 140 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 141 score: 0.9027
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 142 score: 0.9580
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 143 score: 0.9121
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 144 score: 0.9402
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 145 score: 0.9565
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 146 score: 0.9232
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 147 score: 0.9049
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 148 score: 0.9273
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 149 score: 0.9420
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 150 score: 0.9333
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 151 score: 0.8172
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 152 score: 0.8595
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 153 score: 0.8369
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 154 score: 0.8841
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 155 score: 0.9103
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 156 score: 0.9262
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 157 score: 0.8003
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 158 score: 0.9556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 159 score: 0.8623
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 160 score: 0.9335
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 161 score: 0.8723
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 162 score: 0.9432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 163 score: 0.8876
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 164 score: 0.9324
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 165 score: 0.8922
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 166 score: 0.9490
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 167 score: 0.9193
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 168 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 169 score: 0.9057
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 170 score: 0.9210
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 171 score: 0.9300
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 172 score: 0.9071
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 173 score: 0.8410
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 174 score: 0.9360
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 175 score: 0.9694
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 176 score: 0.8331
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 177 score: 0.9261
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 178 score: 0.7411
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 179 score: 0.9324
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 180 score: 0.8449
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 181 score: 0.8628
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 182 score: 0.9339
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 183 score: 0.9411
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 184 score: 0.8275
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 185 score: 0.9581
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 186 score: 0.9543
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 187 score: 0.9261
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 188 score: 0.8702
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 189 score: 0.9300
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 190 score: 0.8406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 191 score: 0.9380
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 192 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 193 score: 0.9142
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 194 score: 0.8890
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 195 score: 0.9397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 196 score: 0.9286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 197 score: 0.8646
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 198 score: 0.9435
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 199 score: 0.9323
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 200 score: 0.8162
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 201 score: 0.8312
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 202 score: 0.8020
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 203 score: 0.8614
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 204 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 205 score: 0.9145
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 206 score: 0.8858
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 207 score: 0.9336
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 208 score: 0.9524
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 209 score: 0.9514
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 210 score: 0.9678
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 211 score: 0.9444
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 212 score: 0.9358
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 213 score: 0.9385
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 214 score: 0.9468
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 215 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 216 score: 0.8629
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 217 score: 0.9280
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 218 score: 0.9103
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 219 score: 0.9387
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 220 score: 0.9736
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 221 score: 0.9347
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 222 score: 0.9443
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 223 score: 0.9142
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 224 score: 0.9498
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 225 score: 0.9746
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 226 score: 0.9129
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 227 score: 0.8706
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 228 score: 0.9324
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 229 score: 0.9347
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 230 score: 0.9630
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 231 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 232 score: 0.8650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 233 score: 0.8854
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 234 score: 0.8476
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 235 score: 0.8637
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 236 score: 0.8674
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 237 score: 0.9016
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 238 score: 0.9532
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 239 score: 0.9322
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 240 score: 0.8815
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 241 score: 0.8615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 242 score: 0.9544
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 243 score: 0.8492
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 244 score: 0.9110
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 245 score: 0.8296
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 246 score: 0.8095
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 247 score: 0.8867
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 248 score: 0.8497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 249 score: 0.9235
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 250 score: 0.9014
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 251 score: 0.9478
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 252 score: 0.9518
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 253 score: 0.8470
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 254 score: 0.9680
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 255 score: 0.9070
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 256 score: 0.9163
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 257 score: 0.9467
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 258 score: 0.9247
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 259 score: 0.9556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 260 score: 0.9625
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 261 score: 0.7804
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 262 score: 0.9579
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 263 score: 0.9196
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 264 score: 0.9446
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 265 score: 0.9144
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 266 score: 0.8865
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 267 score: 0.8207
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 268 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 269 score: 0.9174
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 270 score: 0.9242
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 271 score: 0.8656
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 272 score: 0.9303
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 273 score: 0.8949
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 274 score: 0.7811
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 275 score: 0.8464
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 276 score: 0.9082
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 277 score: 0.9407
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 278 score: 0.8935
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 279 score: 0.8577
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 280 score: 0.9024
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 281 score: 0.9072
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 282 score: 0.9432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 283 score: 0.9336
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 284 score: 0.8841
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 285 score: 0.9678
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 286 score: 0.9109
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 287 score: 0.8590
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 288 score: 0.9283
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 289 score: 0.9033
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 290 score: 0.8632
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 291 score: 0.9121
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 292 score: 0.9282
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 293 score: 0.9187
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 294 score: 0.8654
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 295 score: 0.7462
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 296 score: 0.8642
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 297 score: 0.9311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 298 score: 0.6923
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 299 score: 0.9393
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 300 score: 0.9067
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 301 score: 0.8939
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 302 score: 0.9208
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 303 score: 0.9571
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 304 score: 0.9600
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 305 score: 0.9517
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 306 score: 0.8761
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 307 score: 0.9094
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 308 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 309 score: 0.8392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 310 score: 0.9407
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 311 score: 0.9411
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 312 score: 0.9493
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 313 score: 0.8638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 314 score: 0.9590
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 315 score: 0.9522
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 316 score: 0.9486
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 317 score: 0.9082
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 318 score: 0.8217
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 319 score: 0.8569
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 320 score: 0.8507
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 321 score: 0.9165
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 322 score: 0.9342
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 323 score: 0.9181
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 324 score: 0.9459
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 325 score: 0.9133
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 326 score: 0.8470
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 327 score: 0.9276
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 328 score: 0.8638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 329 score: 0.9292
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 330 score: 0.9345
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 331 score: 0.9328
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 332 score: 0.9311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 333 score: 0.9361
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 334 score: 0.9596
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 335 score: 0.8999
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 336 score: 0.9083
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 337 score: 0.2538
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 338 score: 0.9363
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 339 score: 0.8945
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 340 score: 0.8336
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 341 score: 0.7635
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 342 score: 0.7616
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 343 score: 0.8346
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 344 score: 0.9213
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 345 score: 0.9181
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 346 score: 0.9447
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 347 score: 0.9260
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 348 score: 0.8745
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 349 score: 0.9171
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 350 score: 0.9140
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 351 score: 0.9433
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 352 score: 0.9360
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 353 score: 0.9547
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 354 score: 0.9751
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 355 score: 0.9158
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 356 score: 0.9310
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 357 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 358 score: 0.7194
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 359 score: 0.8367
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 360 score: 0.8474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 361 score: 0.9218
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 362 score: 0.9649
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 363 score: 0.5965
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 364 score: 0.9320
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 365 score: 0.8834
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 366 score: 0.8573
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 367 score: 0.8783
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 368 score: 0.7730
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 369 score: 0.9220
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 370 score: 0.8378
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 371 score: 0.8357
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 372 score: 0.8923
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 373 score: 0.9047
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 374 score: 0.9568
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 375 score: 0.9085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 376 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 377 score: 0.9462
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 378 score: 0.8080
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 379 score: 0.9330
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 380 score: 0.9567
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 381 score: 0.8990
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 382 score: 0.7588
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 383 score: 0.8811
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 384 score: 0.8976
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 385 score: 0.8625
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 386 score: 0.8112
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 387 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 388 score: 0.9366
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 389 score: 0.8669
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 390 score: 0.9285
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 391 score: 0.9055
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 392 score: 0.9400
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 393 score: 0.9725
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 394 score: 0.9536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 395 score: 0.9727
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 396 score: 0.8700
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 397 score: 0.9425
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 398 score: 0.8301
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 399 score: 0.9510
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 400 score: 0.9617
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 401 score: 0.9187
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 402 score: 0.9417
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 403 score: 0.9209
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 404 score: 0.8353
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 405 score: 0.9308
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 406 score: 0.9208
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 407 score: 0.8996
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 408 score: 0.9404
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 409 score: 0.9502
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 410 score: 0.9344
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 411 score: 0.8625
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 412 score: 0.9059
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 413 score: 0.9183
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 414 score: 0.7467
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 415 score: 0.9254
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 416 score: 0.7928
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 417 score: 0.8125
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 418 score: 0.9474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 419 score: 0.9394
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 420 score: 0.9490
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 421 score: 0.9698
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 422 score: 0.9489
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 423 score: 0.9384
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 424 score: 0.9147
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 425 score: 0.9406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 426 score: 0.9429
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 427 score: 0.9183
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 428 score: 0.9294
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 429 score: 0.9590
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 430 score: 0.9312
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 431 score: 0.8642
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 432 score: 0.8552
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 433 score: 0.8432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 434 score: 0.9044
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 435 score: 0.8855
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 436 score: 0.8809
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 437 score: 0.9242
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 438 score: 0.9477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 439 score: 0.9103
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 440 score: 0.9323
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 441 score: 0.9284
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 442 score: 0.9768
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 443 score: 0.9431
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 444 score: 0.8267
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 445 score: 0.8432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 446 score: 0.9460
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 447 score: 0.9545
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 448 score: 0.9374
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 449 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 450 score: 0.8190
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 451 score: 0.9422
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 452 score: 0.9655
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 453 score: 0.8899
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 454 score: 0.9330
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 455 score: 0.8179
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 456 score: 0.8189
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 457 score: 0.9503
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 458 score: 0.9000
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 459 score: 0.9511
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 460 score: 0.9557
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 461 score: 0.8842
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 462 score: 0.8470
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 463 score: 0.9518
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 464 score: 0.9350
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 465 score: 0.9178
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 466 score: 0.9115
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 467 score: 0.7592
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 468 score: 0.8612
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 469 score: 0.7852
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 470 score: 0.7753
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 471 score: 0.9084
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 472 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 473 score: 0.9267
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 474 score: 0.8929
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 475 score: 0.9363
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 476 score: 0.9234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 477 score: 0.9303
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 478 score: 0.8561
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 479 score: 0.9496
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 480 score: 0.8411
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 481 score: 0.9040
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 482 score: 0.8983
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 483 score: 0.9214
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 484 score: 0.9231
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 485 score: 0.9406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 486 score: 0.9236
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 487 score: 0.9143
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 488 score: 0.9648
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 489 score: 0.8814
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 490 score: 0.9211
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 491 score: 0.9527
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 492 score: 0.9392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 493 score: 0.9549
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 494 score: 0.8928
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 495 score: 0.8963
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 496 score: 0.8912
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 497 score: 0.8732
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 498 score: 0.9049
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 499 score: 0.9482
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 500 score: 0.9496
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 501 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 502 score: 0.9435
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 503 score: 0.9057
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 504 score: 0.7938
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 505 score: 0.8911
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 506 score: 0.8409
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 507 score: 0.8866
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 508 score: 0.7286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 509 score: 0.8716
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 510 score: 0.8048
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 511 score: 0.8811
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 512 score: 0.9405
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 513 score: 0.8984
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 514 score: 0.9415
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 515 score: 0.9423
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 516 score: 0.8885
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 517 score: 0.9407
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 518 score: 0.8964
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 519 score: 0.9568
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 520 score: 0.9233
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 521 score: 0.9343
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 522 score: 0.9205
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 523 score: 0.8555
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 524 score: 0.9456
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 525 score: 0.9502
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 526 score: 0.9219
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 527 score: 0.9080
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 528 score: 0.9211
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 529 score: 0.9158
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 530 score: 0.9076
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 531 score: 0.9168
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 532 score: 0.9252
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 533 score: 0.9152
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 534 score: 0.8332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 535 score: 0.8430
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 536 score: 0.8997
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 537 score: 0.7560
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 538 score: 0.8863
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 539 score: 0.9303
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 540 score: 0.8570
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 541 score: 0.8959
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 542 score: 0.9308
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 543 score: 0.9130
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 544 score: 0.9353
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 545 score: 0.9684
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 546 score: 0.8294
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 547 score: 0.7685
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 548 score: 0.8004
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 549 score: 0.9688
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 550 score: 0.8481
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 551 score: 0.9421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 552 score: 0.9417
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 553 score: 0.9311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 554 score: 0.9223
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 555 score: 0.9308
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 556 score: 0.8726
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 557 score: 0.9711
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 558 score: 0.8294
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 559 score: 0.8414
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 560 score: 0.9610
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 561 score: 0.9426
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 562 score: 0.8948
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 563 score: 0.9454
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 564 score: 0.8699
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 565 score: 0.9375
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 566 score: 0.9372
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 567 score: 0.9016
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 568 score: 0.8542
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 569 score: 0.7739
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 570 score: 0.9305
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 571 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 572 score: 0.8615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 573 score: 0.9461
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 574 score: 0.9460
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 575 score: 0.8582
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 576 score: 0.9208
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 577 score: 0.9575
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 578 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 579 score: 0.8898
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 580 score: 0.9409
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 581 score: 0.8227
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 582 score: 0.9447
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 583 score: 0.7767
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 584 score: 0.7226
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 585 score: 0.9336
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 586 score: 0.9506
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 587 score: 0.8891
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 588 score: 0.9266
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 589 score: 0.9639
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 590 score: 0.9372
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 591 score: 0.9289
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 592 score: 0.7396
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 593 score: 0.9370
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 594 score: 0.9673
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 595 score: 0.9450
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 596 score: 0.9115
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 597 score: 0.9328
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 598 score: 0.9084
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 599 score: 0.9151
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 600 score: 0.9173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 601 score: 0.8853
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 602 score: 0.9151
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 603 score: 0.9166
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 604 score: 0.9116
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 605 score: 0.9355
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 606 score: 0.9227
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 607 score: 0.8998
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 608 score: 0.8697
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 609 score: 0.9252
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 610 score: 0.9296
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 611 score: 0.9524
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 612 score: 0.9404
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 613 score: 0.9184
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 614 score: 0.9349
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 615 score: 0.9439
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 616 score: 0.9314
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 617 score: 0.9641
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 618 score: 0.9360
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 619 score: 0.9424
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 620 score: 0.9343
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 621 score: 0.8901
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 622 score: 0.9432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 623 score: 0.9275
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 624 score: 0.9316
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 625 score: 0.9615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 626 score: 0.9639
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 627 score: 0.9597
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 628 score: 0.9406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 629 score: 0.9129
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 630 score: 0.9073
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 631 score: 0.9621
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 632 score: 0.9596
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 633 score: 0.9597
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 634 score: 0.9595
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 635 score: 0.9509
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 636 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 637 score: 0.8928
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 638 score: 0.9609
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 639 score: 0.9670
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 640 score: 0.9244
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 641 score: 0.9399
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 642 score: 0.8930
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 643 score: 0.7174
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 644 score: 0.8871
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 645 score: 0.8389
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 646 score: 0.9028
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 647 score: 0.9115
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 648 score: 0.8245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 649 score: 0.8735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 650 score: 0.9613
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 651 score: 0.8869
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 652 score: 0.7734
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 653 score: 0.8588
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 654 score: 0.8987
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 655 score: 0.9120
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 656 score: 0.9215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 657 score: 0.8210
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 658 score: 0.8380
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 659 score: 0.9167
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 660 score: 0.8800
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 661 score: 0.9406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 662 score: 0.9647
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 663 score: 0.8912
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 664 score: 0.9600
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 665 score: 0.8844
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 666 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 667 score: 0.9468
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 668 score: 0.9157
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 669 score: 0.9470
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 670 score: 0.9030
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 671 score: 0.9349
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 672 score: 0.9192
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 673 score: 0.8821
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 674 score: 0.9421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 675 score: 0.9344
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 676 score: 0.9421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 677 score: 0.9655
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 678 score: 0.9201
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 679 score: 0.9483
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 680 score: 0.8728
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 681 score: 0.9278
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 682 score: 0.9277
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 683 score: 0.8202
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 684 score: 0.9151
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 685 score: 0.9282
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 686 score: 0.8784
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 687 score: 0.8989
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 688 score: 0.9345
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 689 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 690 score: 0.9345
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 691 score: 0.9032
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 692 score: 0.9332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 693 score: 0.7746
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 694 score: 0.8994
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 695 score: 0.9184
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 696 score: 0.9094
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 697 score: 0.8932
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 698 score: 0.8950
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 699 score: 0.9535
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 700 score: 0.8905
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 701 score: 0.9089
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 702 score: 0.9629
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 703 score: 0.8929
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 704 score: 0.9425
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 705 score: 0.9041
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 706 score: 0.7702
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 707 score: 0.9408
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 708 score: 0.9193
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 709 score: 0.9374
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 710 score: 0.9627
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 711 score: 0.9066
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 712 score: 0.9664
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 713 score: 0.9459
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 714 score: 0.9424
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 715 score: 0.9010
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 716 score: 0.9346
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 717 score: 0.9418
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 718 score: 0.9480
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 719 score: 0.9511
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 720 score: 0.9602
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 721 score: 0.8872
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 722 score: 0.9347
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 723 score: 0.9563
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 724 score: 0.9440
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 725 score: 0.9327
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 726 score: 0.9077
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 727 score: 0.9138
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 728 score: 0.6614
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 729 score: 0.9048
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 730 score: 0.8994
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 731 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 732 score: 0.8396
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 733 score: 0.9600
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 734 score: 0.8941
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 735 score: 0.9275
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 736 score: 0.9397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 737 score: 0.9135
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 738 score: 0.9271
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 739 score: 0.9477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 740 score: 0.9298
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 741 score: 0.9226
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 742 score: 0.9004
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 743 score: 0.9543
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 744 score: 0.9371
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 745 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 746 score: 0.9421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 747 score: 0.9472
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 748 score: 0.9696
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 749 score: 0.9503
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 750 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 751 score: 0.8388
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 752 score: 0.9052
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 753 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 754 score: 0.9145
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 755 score: 0.9317
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 756 score: 0.9182
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 757 score: 0.9237
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 758 score: 0.9297
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 759 score: 0.9467
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 760 score: 0.9542
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 761 score: 0.9422
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 762 score: 0.9565
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 763 score: 0.8695
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 764 score: 0.9363
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 765 score: 0.8867
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 766 score: 0.9402
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 767 score: 0.9223
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 768 score: 0.9727
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 769 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 770 score: 0.9397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 771 score: 0.9418
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 772 score: 0.9383
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 773 score: 0.9187
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 774 score: 0.9356
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 775 score: 0.8365
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 776 score: 0.8913
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 777 score: 0.9692
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 778 score: 0.8801
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 779 score: 0.7768
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 780 score: 0.9238
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 781 score: 0.8168
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 782 score: 0.9174
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 783 score: 0.7556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 784 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 785 score: 0.8185
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 786 score: 0.8937
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 787 score: 0.9442
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 788 score: 0.9524
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 789 score: 0.9354
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 790 score: 0.9332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 791 score: 0.9085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 792 score: 0.9201
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 793 score: 0.8184
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 794 score: 0.9182
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 795 score: 0.9163
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 796 score: 0.9757
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 797 score: 0.8378
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 798 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 799 score: 0.8329
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 800 score: 0.9418
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 801 score: 0.8679
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 802 score: 0.9309
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 803 score: 0.9063
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 804 score: 0.7824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 805 score: 0.9389
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 806 score: 0.9362
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 807 score: 0.9355
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 808 score: 0.9172
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 809 score: 0.8803
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 810 score: 0.8954
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 811 score: 0.8578
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 812 score: 0.9600
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 813 score: 0.9535
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 814 score: 0.9249
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 815 score: 0.7613
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 816 score: 0.8563
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 817 score: 0.8905
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 818 score: 0.8141
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 819 score: 0.9185
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 820 score: 0.9463
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 821 score: 0.9539
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 822 score: 0.9401
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 823 score: 0.9238
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 824 score: 0.9239
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 825 score: 0.9202
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 826 score: 0.9119
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 827 score: 0.9297
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 828 score: 0.9150
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 829 score: 0.9427
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 830 score: 0.9059
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 831 score: 0.9235
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 832 score: 0.9092
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 833 score: 0.8782
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 834 score: 0.9175
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 835 score: 0.7859
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 836 score: 0.9463
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 837 score: 0.8998
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 838 score: 0.9208
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 839 score: 0.8819
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 840 score: 0.9352
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 841 score: 0.8897
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 842 score: 0.8130
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 843 score: 0.8783
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 844 score: 0.8441
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 845 score: 0.9188
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 846 score: 0.6590
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 847 score: 0.8772
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 848 score: 0.8241
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 849 score: 0.9064
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 850 score: 0.8993
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 851 score: 0.9484
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 852 score: 0.9364
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 853 score: 0.8256
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 854 score: 0.9029
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 855 score: 0.8930
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 856 score: 0.8581
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 857 score: 0.9124
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 858 score: 0.9245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 859 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 860 score: 0.9189
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 861 score: 0.9319
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 862 score: 0.9509
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 863 score: 0.9037
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 864 score: 0.8617
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 865 score: 0.8840
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 866 score: 0.8997
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 867 score: 0.9344
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 868 score: 0.9087
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 869 score: 0.9239
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 870 score: 0.8911
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 871 score: 0.9029
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 872 score: 0.9243
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 873 score: 0.9357
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 874 score: 0.9284
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 875 score: 0.9030
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 876 score: 0.9195
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 877 score: 0.8929
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 878 score: 0.9596
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 879 score: 0.8661
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 880 score: 0.9120
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 881 score: 0.9498
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 882 score: 0.9337
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 883 score: 0.9502
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 884 score: 0.8849
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 885 score: 0.9286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 886 score: 0.9472
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 887 score: 0.7959
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 888 score: 0.8680
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 889 score: 0.8675
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 890 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 891 score: 0.9303
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 892 score: 0.8751
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 893 score: 0.8681
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 894 score: 0.9020
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 895 score: 0.9494
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 896 score: 0.9284
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 897 score: 0.9183
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 898 score: 0.9624
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 899 score: 0.9107
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 900 score: 0.9107
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 901 score: 0.9484
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 902 score: 0.8816
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 903 score: 0.9386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 904 score: 0.9158
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 905 score: 0.8484
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 906 score: 0.9141
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 907 score: 0.9206
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 908 score: 0.8927
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 909 score: 0.9533
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 910 score: 0.9207
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 911 score: 0.9276
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 912 score: 0.9446
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 913 score: 0.9152
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 914 score: 0.8858
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 915 score: 0.9258
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 916 score: 0.9374
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 917 score: 0.9396
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 918 score: 0.9526
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 919 score: 0.9271
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 920 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 921 score: 0.7991
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 922 score: 0.9191
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 923 score: 0.9105
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 924 score: 0.9262
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 925 score: 0.9085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 926 score: 0.9658
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 927 score: 0.9524
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 928 score: 0.9315
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 929 score: 0.8959
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 930 score: 0.9108
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 931 score: 0.8118
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 932 score: 0.8073
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 933 score: 0.8858
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 934 score: 0.9113
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 935 score: 0.9111
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 936 score: 0.9232
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 937 score: 0.9757
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 938 score: 0.9594
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 939 score: 0.9392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 940 score: 0.9642
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 941 score: 0.9791
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 942 score: 0.9584
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 943 score: 0.9125
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 944 score: 0.8380
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 945 score: 0.9459
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 946 score: 0.9360
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 947 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 948 score: 0.9144
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 949 score: 0.9372
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 950 score: 0.8455
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 951 score: 0.9285
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 952 score: 0.8450
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 953 score: 0.9493
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 954 score: 0.7579
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 955 score: 0.9536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 956 score: 0.9505
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 957 score: 0.8896
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 958 score: 0.9290
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 959 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 960 score: 0.8309
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 961 score: 0.7331
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 962 score: 0.9330
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 963 score: 0.9559
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 964 score: 0.9569
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 965 score: 0.9280
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 966 score: 0.8884
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 967 score: 0.8943
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 968 score: 0.9527
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 969 score: 0.7556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 970 score: 0.8959
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 971 score: 0.8814
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 972 score: 0.8515
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 973 score: 0.9356
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 974 score: 0.8943
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 975 score: 0.9423
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 976 score: 0.9172
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 977 score: 0.6410
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 978 score: 0.9352
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 979 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 980 score: 0.9539
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 981 score: 0.8844
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 982 score: 0.9513
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 983 score: 0.8822
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 984 score: 0.9480
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 985 score: 0.9440
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 986 score: 0.9031
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 987 score: 0.9234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 988 score: 0.8683
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 989 score: 0.6374
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 990 score: 0.9257
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 991 score: 0.8846
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 992 score: 0.9260
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 993 score: 0.9242
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 994 score: 0.9631
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 995 score: 0.9306
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 996 score: 0.9536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 997 score: 0.9733
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 998 score: 0.9056
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 999 score: 0.9140
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1000 score: 0.9571
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1001 score: 0.8603
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1002 score: 0.9534
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1003 score: 0.8770
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1004 score: 0.9351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1005 score: 0.9453
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1006 score: 0.9426
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1007 score: 0.9247
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1008 score: 0.9556
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1009 score: 0.9028
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1010 score: 0.9253
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg Segment 1011 score: 0.9161
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-bg-max-tokens-512/test-en-bg score: 0.9051