TongZheng1999's picture
Upload folder using huggingface_hub
357e605 verified
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 0 score: 0.8765
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1 score: 0.8938
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 2 score: 0.9208
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 3 score: 0.8723
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 4 score: 0.7231
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 5 score: 0.7871
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 6 score: 0.8311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 7 score: 0.9139
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 8 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 9 score: 0.9240
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 10 score: 0.9423
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 11 score: 0.9017
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 12 score: 0.9041
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 13 score: 0.9046
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 14 score: 0.7997
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 15 score: 0.7732
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 16 score: 0.8671
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 17 score: 0.9331
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 18 score: 0.8564
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 19 score: 0.8865
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 20 score: 0.9534
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 21 score: 0.9575
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 22 score: 0.9007
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 23 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 24 score: 0.8842
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 25 score: 0.9544
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 26 score: 0.9075
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 27 score: 0.8845
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 28 score: 0.8211
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 29 score: 0.8361
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 30 score: 0.7915
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 31 score: 0.8830
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 32 score: 0.8778
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 33 score: 0.9279
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 34 score: 0.9704
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 35 score: 0.9640
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 36 score: 0.9131
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 37 score: 0.9090
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 38 score: 0.8355
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 39 score: 0.8668
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 40 score: 0.8770
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 41 score: 0.9356
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 42 score: 0.9149
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 43 score: 0.9133
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 44 score: 0.9368
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 45 score: 0.8407
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 46 score: 0.8804
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 47 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 48 score: 0.9430
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 49 score: 0.9164
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 50 score: 0.8925
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 51 score: 0.9215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 52 score: 0.9288
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 53 score: 0.9380
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 54 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 55 score: 0.9441
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 56 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 57 score: 0.9066
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 58 score: 0.9282
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 59 score: 0.9536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 60 score: 0.9429
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 61 score: 0.9047
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 62 score: 0.8902
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 63 score: 0.9078
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 64 score: 0.9267
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 65 score: 0.8139
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 66 score: 0.8138
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 67 score: 0.7207
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 68 score: 0.9477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 69 score: 0.9114
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 70 score: 0.8602
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 71 score: 0.8474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 72 score: 0.9129
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 73 score: 0.8891
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 74 score: 0.8321
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 75 score: 0.8551
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 76 score: 0.8791
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 77 score: 0.9101
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 78 score: 0.9419
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 79 score: 0.9343
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 80 score: 0.9074
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 81 score: 0.9432
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 82 score: 0.8712
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 83 score: 0.8386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 84 score: 0.8271
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 85 score: 0.9171
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 86 score: 0.7700
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 87 score: 0.9075
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 88 score: 0.9125
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 89 score: 0.9177
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 90 score: 0.9069
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 91 score: 0.9077
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 92 score: 0.8553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 93 score: 0.8695
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 94 score: 0.8854
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 95 score: 0.9333
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 96 score: 0.9136
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 97 score: 0.9290
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 98 score: 0.9421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 99 score: 0.9299
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 100 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 101 score: 0.8910
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 102 score: 0.9070
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 103 score: 0.9505
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 104 score: 0.9502
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 105 score: 0.8715
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 106 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 107 score: 0.8826
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 108 score: 0.8065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 109 score: 0.7798
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 110 score: 0.9156
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 111 score: 0.9646
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 112 score: 0.9355
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 113 score: 0.9615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 114 score: 0.9010
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 115 score: 0.9336
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 116 score: 0.9284
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 117 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 118 score: 0.9622
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 119 score: 0.8693
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 120 score: 0.8112
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 121 score: 0.8553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 122 score: 0.9520
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 123 score: 0.9484
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 124 score: 0.9124
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 125 score: 0.9054
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 126 score: 0.9390
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 127 score: 0.9305
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 128 score: 0.9511
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 129 score: 0.9010
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 130 score: 0.8965
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 131 score: 0.9364
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 132 score: 0.9269
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 133 score: 0.9420
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 134 score: 0.8234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 135 score: 0.8600
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 136 score: 0.9070
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 137 score: 0.9263
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 138 score: 0.9513
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 139 score: 0.8883
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 140 score: 0.8501
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 141 score: 0.7985
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 142 score: 0.9426
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 143 score: 0.8925
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 144 score: 0.9254
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 145 score: 0.9339
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 146 score: 0.9129
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 147 score: 0.9115
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 148 score: 0.9271
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 149 score: 0.9076
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 150 score: 0.9335
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 151 score: 0.8421
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 152 score: 0.8459
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 153 score: 0.8498
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 154 score: 0.7629
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 155 score: 0.8721
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 156 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 157 score: 0.7737
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 158 score: 0.9429
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 159 score: 0.9397
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 160 score: 0.9392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 161 score: 0.8416
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 162 score: 0.9249
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 163 score: 0.9243
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 164 score: 0.9317
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 165 score: 0.8619
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 166 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 167 score: 0.8765
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 168 score: 0.8762
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 169 score: 0.7785
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 170 score: 0.8934
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 171 score: 0.9571
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 172 score: 0.8783
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 173 score: 0.8855
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 174 score: 0.8731
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 175 score: 0.9337
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 176 score: 0.8650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 177 score: 0.9394
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 178 score: 0.9171
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 179 score: 0.9392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 180 score: 0.9227
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 181 score: 0.9177
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 182 score: 0.9141
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 183 score: 0.8892
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 184 score: 0.9173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 185 score: 0.9404
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 186 score: 0.9646
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 187 score: 0.8880
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 188 score: 0.8717
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 189 score: 0.9175
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 190 score: 0.8995
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 191 score: 0.9245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 192 score: 0.8569
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 193 score: 0.8382
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 194 score: 0.9258
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 195 score: 0.9541
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 196 score: 0.8813
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 197 score: 0.8463
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 198 score: 0.8864
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 199 score: 0.8926
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 200 score: 0.8576
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 201 score: 0.8422
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 202 score: 0.8205
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 203 score: 0.8045
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 204 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 205 score: 0.8981
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 206 score: 0.9532
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 207 score: 0.8743
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 208 score: 0.8997
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 209 score: 0.8889
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 210 score: 0.9614
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 211 score: 0.9126
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 212 score: 0.9253
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 213 score: 0.9350
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 214 score: 0.9090
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 215 score: 0.9281
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 216 score: 0.9452
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 217 score: 0.9388
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 218 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 219 score: 0.9492
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 220 score: 0.9240
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 221 score: 0.9278
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 222 score: 0.9158
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 223 score: 0.8610
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 224 score: 0.8659
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 225 score: 0.9329
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 226 score: 0.8857
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 227 score: 0.7727
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 228 score: 0.9041
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 229 score: 0.9366
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 230 score: 0.8963
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 231 score: 0.9238
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 232 score: 0.8699
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 233 score: 0.9114
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 234 score: 0.8765
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 235 score: 0.9434
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 236 score: 0.9273
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 237 score: 0.8878
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 238 score: 0.9379
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 239 score: 0.9067
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 240 score: 0.7607
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 241 score: 0.8881
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 242 score: 0.8598
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 243 score: 0.7972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 244 score: 0.9161
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 245 score: 0.8532
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 246 score: 0.7740
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 247 score: 0.7932
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 248 score: 0.8416
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 249 score: 0.8956
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 250 score: 0.9056
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 251 score: 0.9475
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 252 score: 0.9450
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 253 score: 0.9082
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 254 score: 0.9543
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 255 score: 0.9265
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 256 score: 0.9071
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 257 score: 0.9327
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 258 score: 0.8736
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 259 score: 0.8302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 260 score: 0.9263
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 261 score: 0.8255
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 262 score: 0.9189
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 263 score: 0.8876
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 264 score: 0.9256
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 265 score: 0.8977
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 266 score: 0.8909
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 267 score: 0.8463
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 268 score: 0.9254
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 269 score: 0.9017
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 270 score: 0.9106
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 271 score: 0.8527
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 272 score: 0.8019
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 273 score: 0.9285
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 274 score: 0.7803
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 275 score: 0.8267
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 276 score: 0.8334
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 277 score: 0.9496
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 278 score: 0.8536
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 279 score: 0.9539
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 280 score: 0.9227
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 281 score: 0.8877
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 282 score: 0.9633
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 283 score: 0.9278
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 284 score: 0.9112
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 285 score: 0.9386
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 286 score: 0.8743
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 287 score: 0.8603
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 288 score: 0.9326
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 289 score: 0.9113
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 290 score: 0.8687
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 291 score: 0.8619
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 292 score: 0.9401
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 293 score: 0.9232
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 294 score: 0.8285
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 295 score: 0.9002
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 296 score: 0.8581
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 297 score: 0.9316
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 298 score: 0.9185
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 299 score: 0.9062
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 300 score: 0.8876
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 301 score: 0.8439
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 302 score: 0.9257
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 303 score: 0.9465
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 304 score: 0.9205
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 305 score: 0.9438
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 306 score: 0.8816
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 307 score: 0.9069
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 308 score: 0.9296
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 309 score: 0.8298
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 310 score: 0.9771
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 311 score: 0.9581
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 312 score: 0.9517
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 313 score: 0.7834
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 314 score: 0.9436
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 315 score: 0.8991
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 316 score: 0.8834
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 317 score: 0.8889
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 318 score: 0.8575
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 319 score: 0.9529
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 320 score: 0.8577
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 321 score: 0.8155
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 322 score: 0.7312
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 323 score: 0.9195
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 324 score: 0.9130
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 325 score: 0.9226
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 326 score: 0.8735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 327 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 328 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 329 score: 0.7929
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 330 score: 0.9178
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 331 score: 0.9509
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 332 score: 0.9461
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 333 score: 0.7810
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 334 score: 0.9417
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 335 score: 0.9050
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 336 score: 0.9215
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 337 score: 0.8726
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 338 score: 0.8939
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 339 score: 0.9190
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 340 score: 0.8399
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 341 score: 0.8841
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 342 score: 0.7819
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 343 score: 0.8525
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 344 score: 0.9245
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 345 score: 0.8561
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 346 score: 0.9545
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 347 score: 0.9420
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 348 score: 0.8514
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 349 score: 0.8138
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 350 score: 0.9000
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 351 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 352 score: 0.8409
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 353 score: 0.9547
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 354 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 355 score: 0.9335
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 356 score: 0.9286
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 357 score: 0.9591
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 358 score: 0.8524
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 359 score: 0.8758
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 360 score: 0.8742
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 361 score: 0.8485
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 362 score: 0.8280
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 363 score: 0.7862
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 364 score: 0.9001
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 365 score: 0.8606
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 366 score: 0.8878
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 367 score: 0.9306
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 368 score: 0.8553
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 369 score: 0.8461
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 370 score: 0.6947
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 371 score: 0.7303
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 372 score: 0.8331
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 373 score: 0.8260
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 374 score: 0.9615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 375 score: 0.9045
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 376 score: 0.9507
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 377 score: 0.9549
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 378 score: 0.8526
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 379 score: 0.8842
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 380 score: 0.8900
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 381 score: 0.7956
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 382 score: 0.8223
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 383 score: 0.8850
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 384 score: 0.9015
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 385 score: 0.8454
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 386 score: 0.8735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 387 score: 0.8351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 388 score: 0.9298
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 389 score: 0.8872
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 390 score: 0.9407
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 391 score: 0.9387
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 392 score: 0.9255
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 393 score: 0.9780
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 394 score: 0.9794
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 395 score: 0.9464
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 396 score: 0.7519
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 397 score: 0.9303
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 398 score: 0.8406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 399 score: 0.9189
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 400 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 401 score: 0.8488
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 402 score: 0.9167
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 403 score: 0.8034
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 404 score: 0.8585
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 405 score: 0.8564
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 406 score: 0.9170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 407 score: 0.9257
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 408 score: 0.9534
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 409 score: 0.8839
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 410 score: 0.9485
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 411 score: 0.8969
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 412 score: 0.8988
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 413 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 414 score: 0.9169
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 415 score: 0.8905
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 416 score: 0.8573
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 417 score: 0.8945
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 418 score: 0.8903
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 419 score: 0.9483
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 420 score: 0.9630
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 421 score: 0.9410
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 422 score: 0.9067
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 423 score: 0.7947
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 424 score: 0.9090
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 425 score: 0.9348
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 426 score: 0.9402
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 427 score: 0.9404
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 428 score: 0.9225
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 429 score: 0.9206
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 430 score: 0.8926
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 431 score: 0.8069
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 432 score: 0.8815
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 433 score: 0.6917
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 434 score: 0.8793
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 435 score: 0.7780
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 436 score: 0.8733
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 437 score: 0.9390
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 438 score: 0.9454
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 439 score: 0.8375
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 440 score: 0.9280
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 441 score: 0.9247
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 442 score: 0.9566
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 443 score: 0.8962
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 444 score: 0.8855
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 445 score: 0.8797
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 446 score: 0.9486
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 447 score: 0.9499
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 448 score: 0.9499
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 449 score: 0.8371
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 450 score: 0.9278
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 451 score: 0.8736
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 452 score: 0.9638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 453 score: 0.9099
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 454 score: 0.9429
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 455 score: 0.8787
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 456 score: 0.7539
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 457 score: 0.9494
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 458 score: 0.9357
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 459 score: 0.8798
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 460 score: 0.9508
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 461 score: 0.8804
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 462 score: 0.8930
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 463 score: 0.9306
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 464 score: 0.9131
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 465 score: 0.8887
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 466 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 467 score: 0.6240
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 468 score: 0.8048
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 469 score: 0.7914
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 470 score: 0.5864
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 471 score: 0.8282
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 472 score: 0.8996
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 473 score: 0.8835
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 474 score: 0.7582
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 475 score: 0.8994
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 476 score: 0.8838
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 477 score: 0.9414
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 478 score: 0.9486
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 479 score: 0.8995
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 480 score: 0.9274
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 481 score: 0.8505
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 482 score: 0.9016
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 483 score: 0.9065
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 484 score: 0.8918
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 485 score: 0.8779
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 486 score: 0.9652
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 487 score: 0.8513
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 488 score: 0.9704
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 489 score: 0.9413
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 490 score: 0.9155
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 491 score: 0.9408
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 492 score: 0.8858
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 493 score: 0.9340
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 494 score: 0.9000
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 495 score: 0.8776
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 496 score: 0.9390
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 497 score: 0.9122
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 498 score: 0.9461
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 499 score: 0.9309
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 500 score: 0.9566
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 501 score: 0.9650
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 502 score: 0.9115
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 503 score: 0.8817
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 504 score: 0.8722
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 505 score: 0.8641
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 506 score: 0.7481
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 507 score: 0.8541
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 508 score: 0.8780
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 509 score: 0.8499
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 510 score: 0.7196
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 511 score: 0.8623
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 512 score: 0.8830
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 513 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 514 score: 0.9382
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 515 score: 0.8585
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 516 score: 0.8406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 517 score: 0.9330
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 518 score: 0.9294
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 519 score: 0.9524
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 520 score: 0.8862
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 521 score: 0.9533
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 522 score: 0.8962
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 523 score: 0.8658
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 524 score: 0.9392
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 525 score: 0.9351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 526 score: 0.8959
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 527 score: 0.8890
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 528 score: 0.9083
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 529 score: 0.8680
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 530 score: 0.8537
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 531 score: 0.9062
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 532 score: 0.8642
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 533 score: 0.8953
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 534 score: 0.8552
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 535 score: 0.7794
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 536 score: 0.8710
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 537 score: 0.8853
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 538 score: 0.9474
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 539 score: 0.9077
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 540 score: 0.9041
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 541 score: 0.9367
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 542 score: 0.8949
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 543 score: 0.8937
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 544 score: 0.9024
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 545 score: 0.9419
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 546 score: 0.7002
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 547 score: 0.8649
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 548 score: 0.8557
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 549 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 550 score: 0.8051
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 551 score: 0.9266
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 552 score: 0.8753
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 553 score: 0.9417
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 554 score: 0.8325
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 555 score: 0.8820
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 556 score: 0.8570
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 557 score: 0.8387
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 558 score: 0.7722
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 559 score: 0.8022
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 560 score: 0.9614
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 561 score: 0.9015
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 562 score: 0.8549
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 563 score: 0.7875
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 564 score: 0.7468
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 565 score: 0.9339
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 566 score: 0.9108
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 567 score: 0.9268
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 568 score: 0.8262
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 569 score: 0.7548
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 570 score: 0.9293
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 571 score: 0.8911
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 572 score: 0.8170
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 573 score: 0.9089
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 574 score: 0.9595
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 575 score: 0.6767
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 576 score: 0.9026
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 577 score: 0.9370
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 578 score: 0.9317
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 579 score: 0.9167
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 580 score: 0.8816
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 581 score: 0.9216
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 582 score: 0.8319
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 583 score: 0.7679
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 584 score: 0.8001
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 585 score: 0.8978
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 586 score: 0.8709
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 587 score: 0.9196
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 588 score: 0.8752
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 589 score: 0.8730
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 590 score: 0.9291
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 591 score: 0.9379
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 592 score: 0.8322
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 593 score: 0.9491
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 594 score: 0.8843
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 595 score: 0.8420
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 596 score: 0.9015
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 597 score: 0.8902
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 598 score: 0.8657
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 599 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 600 score: 0.9324
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 601 score: 0.8746
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 602 score: 0.9514
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 603 score: 0.9351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 604 score: 0.9213
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 605 score: 0.9211
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 606 score: 0.8689
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 607 score: 0.7415
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 608 score: 0.9207
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 609 score: 0.8559
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 610 score: 0.9384
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 611 score: 0.9279
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 612 score: 0.9109
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 613 score: 0.9089
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 614 score: 0.9308
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 615 score: 0.9514
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 616 score: 0.9547
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 617 score: 0.9507
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 618 score: 0.9102
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 619 score: 0.8906
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 620 score: 0.9367
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 621 score: 0.7884
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 622 score: 0.9365
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 623 score: 0.9205
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 624 score: 0.8842
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 625 score: 0.8864
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 626 score: 0.9351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 627 score: 0.9501
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 628 score: 0.9523
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 629 score: 0.9240
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 630 score: 0.8842
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 631 score: 0.9220
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 632 score: 0.9508
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 633 score: 0.9596
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 634 score: 0.9686
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 635 score: 0.9300
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 636 score: 0.9240
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 637 score: 0.9173
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 638 score: 0.9209
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 639 score: 0.9507
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 640 score: 0.9227
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 641 score: 0.9435
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 642 score: 0.9295
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 643 score: 0.9221
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 644 score: 0.8277
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 645 score: 0.8122
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 646 score: 0.8070
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 647 score: 0.8849
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 648 score: 0.8845
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 649 score: 0.9036
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 650 score: 0.9521
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 651 score: 0.8501
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 652 score: 0.6671
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 653 score: 0.8867
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 654 score: 0.8024
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 655 score: 0.9264
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 656 score: 0.8977
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 657 score: 0.9464
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 658 score: 0.7447
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 659 score: 0.8926
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 660 score: 0.8327
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 661 score: 0.9137
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 662 score: 0.9277
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 663 score: 0.9161
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 664 score: 0.9079
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 665 score: 0.9107
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 666 score: 0.9222
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 667 score: 0.8792
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 668 score: 0.9025
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 669 score: 0.9168
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 670 score: 0.9048
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 671 score: 0.9305
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 672 score: 0.9180
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 673 score: 0.9143
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 674 score: 0.9129
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 675 score: 0.9384
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 676 score: 0.9359
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 677 score: 0.9231
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 678 score: 0.9195
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 679 score: 0.9484
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 680 score: 0.9098
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 681 score: 0.9638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 682 score: 0.8963
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 683 score: 0.8784
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 684 score: 0.8736
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 685 score: 0.9258
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 686 score: 0.8865
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 687 score: 0.8678
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 688 score: 0.9111
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 689 score: 0.9135
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 690 score: 0.9101
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 691 score: 0.8970
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 692 score: 0.9223
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 693 score: 0.8214
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 694 score: 0.7396
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 695 score: 0.9233
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 696 score: 0.8968
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 697 score: 0.8739
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 698 score: 0.9296
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 699 score: 0.9513
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 700 score: 0.8924
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 701 score: 0.9377
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 702 score: 0.9610
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 703 score: 0.8559
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 704 score: 0.9278
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 705 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 706 score: 0.8366
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 707 score: 0.9231
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 708 score: 0.9318
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 709 score: 0.9281
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 710 score: 0.9179
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 711 score: 0.8545
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 712 score: 0.9497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 713 score: 0.9287
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 714 score: 0.9222
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 715 score: 0.9040
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 716 score: 0.8659
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 717 score: 0.9095
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 718 score: 0.9228
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 719 score: 0.8381
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 720 score: 0.8811
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 721 score: 0.9155
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 722 score: 0.8615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 723 score: 0.9200
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 724 score: 0.9400
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 725 score: 0.9058
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 726 score: 0.8875
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 727 score: 0.9211
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 728 score: 0.8143
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 729 score: 0.8667
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 730 score: 0.9390
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 731 score: 0.9094
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 732 score: 0.8937
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 733 score: 0.9428
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 734 score: 0.8163
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 735 score: 0.8592
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 736 score: 0.8824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 737 score: 0.8713
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 738 score: 0.9449
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 739 score: 0.8912
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 740 score: 0.9528
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 741 score: 0.8371
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 742 score: 0.8888
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 743 score: 0.9189
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 744 score: 0.8662
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 745 score: 0.9459
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 746 score: 0.8803
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 747 score: 0.9232
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 748 score: 0.9676
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 749 score: 0.8872
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 750 score: 0.9483
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 751 score: 0.9681
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 752 score: 0.9720
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 753 score: 0.9255
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 754 score: 0.8768
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 755 score: 0.9307
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 756 score: 0.9138
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 757 score: 0.8846
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 758 score: 0.9074
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 759 score: 0.9335
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 760 score: 0.9549
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 761 score: 0.9066
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 762 score: 0.9306
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 763 score: 0.8805
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 764 score: 0.8892
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 765 score: 0.8361
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 766 score: 0.9226
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 767 score: 0.9292
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 768 score: 0.9472
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 769 score: 0.9658
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 770 score: 0.9163
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 771 score: 0.9171
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 772 score: 0.9298
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 773 score: 0.9048
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 774 score: 0.8749
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 775 score: 0.8615
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 776 score: 0.8153
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 777 score: 0.9160
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 778 score: 0.9310
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 779 score: 0.7914
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 780 score: 0.8762
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 781 score: 0.8978
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 782 score: 0.9418
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 783 score: 0.8853
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 784 score: 0.8791
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 785 score: 0.7964
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 786 score: 0.9077
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 787 score: 0.9222
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 788 score: 0.9384
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 789 score: 0.9010
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 790 score: 0.9301
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 791 score: 0.9114
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 792 score: 0.8822
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 793 score: 0.8790
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 794 score: 0.9033
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 795 score: 0.8974
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 796 score: 0.9755
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 797 score: 0.8660
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 798 score: 0.9364
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 799 score: 0.8187
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 800 score: 0.8167
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 801 score: 0.8094
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 802 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 803 score: 0.9332
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 804 score: 0.8282
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 805 score: 0.9009
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 806 score: 0.9537
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 807 score: 0.8293
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 808 score: 0.9271
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 809 score: 0.8601
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 810 score: 0.9353
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 811 score: 0.8297
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 812 score: 0.9168
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 813 score: 0.9384
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 814 score: 0.9273
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 815 score: 0.8803
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 816 score: 0.8762
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 817 score: 0.8554
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 818 score: 0.8085
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 819 score: 0.9210
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 820 score: 0.9568
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 821 score: 0.9581
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 822 score: 0.8565
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 823 score: 0.9214
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 824 score: 0.9451
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 825 score: 0.9142
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 826 score: 0.8497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 827 score: 0.9225
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 828 score: 0.9116
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 829 score: 0.8735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 830 score: 0.8835
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 831 score: 0.8584
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 832 score: 0.8751
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 833 score: 0.8109
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 834 score: 0.8497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 835 score: 0.7924
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 836 score: 0.8994
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 837 score: 0.9244
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 838 score: 0.9309
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 839 score: 0.9068
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 840 score: 0.9144
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 841 score: 0.8501
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 842 score: 0.7824
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 843 score: 0.8852
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 844 score: 0.8362
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 845 score: 0.8574
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 846 score: 0.7137
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 847 score: 0.8224
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 848 score: 0.6809
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 849 score: 0.7345
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 850 score: 0.8717
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 851 score: 0.9266
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 852 score: 0.9064
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 853 score: 0.7465
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 854 score: 0.8664
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 855 score: 0.9311
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 856 score: 0.8696
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 857 score: 0.9351
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 858 score: 0.9056
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 859 score: 0.8635
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 860 score: 0.8832
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 861 score: 0.8834
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 862 score: 0.9543
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 863 score: 0.9444
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 864 score: 0.8942
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 865 score: 0.8698
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 866 score: 0.9155
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 867 score: 0.9044
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 868 score: 0.9072
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 869 score: 0.7579
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 870 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 871 score: 0.8945
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 872 score: 0.9212
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 873 score: 0.9335
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 874 score: 0.9015
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 875 score: 0.9043
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 876 score: 0.8290
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 877 score: 0.9054
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 878 score: 0.9391
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 879 score: 0.9095
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 880 score: 0.9224
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 881 score: 0.9132
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 882 score: 0.9439
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 883 score: 0.9016
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 884 score: 0.8486
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 885 score: 0.8952
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 886 score: 0.9469
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 887 score: 0.7436
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 888 score: 0.7140
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 889 score: 0.9141
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 890 score: 0.9031
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 891 score: 0.9234
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 892 score: 0.7952
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 893 score: 0.8623
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 894 score: 0.9019
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 895 score: 0.8794
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 896 score: 0.9566
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 897 score: 0.8330
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 898 score: 0.9099
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 899 score: 0.8970
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 900 score: 0.9047
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 901 score: 0.8130
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 902 score: 0.9385
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 903 score: 0.8875
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 904 score: 0.8880
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 905 score: 0.9079
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 906 score: 0.8867
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 907 score: 0.8567
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 908 score: 0.8972
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 909 score: 0.9626
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 910 score: 0.9037
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 911 score: 0.9062
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 912 score: 0.8986
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 913 score: 0.9661
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 914 score: 0.8757
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 915 score: 0.8771
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 916 score: 0.9718
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 917 score: 0.8727
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 918 score: 0.9695
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 919 score: 0.9195
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 920 score: 0.8983
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 921 score: 0.8811
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 922 score: 0.9133
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 923 score: 0.9232
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 924 score: 0.8464
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 925 score: 0.9153
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 926 score: 0.9166
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 927 score: 0.8735
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 928 score: 0.9304
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 929 score: 0.8638
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 930 score: 0.9428
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 931 score: 0.8908
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 932 score: 0.8039
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 933 score: 0.8599
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 934 score: 0.8922
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 935 score: 0.8819
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 936 score: 0.9063
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 937 score: 0.9480
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 938 score: 0.9560
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 939 score: 0.9403
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 940 score: 0.9079
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 941 score: 0.9563
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 942 score: 0.9322
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 943 score: 0.8946
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 944 score: 0.7936
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 945 score: 0.9535
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 946 score: 0.8160
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 947 score: 0.9260
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 948 score: 0.8773
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 949 score: 0.8779
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 950 score: 0.8884
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 951 score: 0.9011
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 952 score: 0.8497
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 953 score: 0.9239
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 954 score: 0.7207
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 955 score: 0.9370
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 956 score: 0.8689
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 957 score: 0.9471
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 958 score: 0.9191
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 959 score: 0.9064
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 960 score: 0.8695
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 961 score: 0.8520
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 962 score: 0.9093
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 963 score: 0.9067
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 964 score: 0.9462
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 965 score: 0.8538
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 966 score: 0.9087
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 967 score: 0.8160
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 968 score: 0.6846
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 969 score: 0.7425
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 970 score: 0.8995
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 971 score: 0.9082
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 972 score: 0.9102
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 973 score: 0.9654
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 974 score: 0.8911
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 975 score: 0.9460
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 976 score: 0.9190
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 977 score: 0.8546
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 978 score: 0.9552
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 979 score: 0.8969
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 980 score: 0.8406
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 981 score: 0.9039
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 982 score: 0.9077
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 983 score: 0.8346
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 984 score: 0.9431
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 985 score: 0.9477
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 986 score: 0.8925
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 987 score: 0.8837
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 988 score: 0.8281
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 989 score: 0.8817
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 990 score: 0.8952
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 991 score: 0.8703
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 992 score: 0.9290
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 993 score: 0.8895
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 994 score: 0.7704
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 995 score: 0.8913
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 996 score: 0.9782
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 997 score: 0.9613
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 998 score: 0.9030
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 999 score: 0.9302
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1000 score: 0.9440
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1001 score: 0.8439
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1002 score: 0.8681
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1003 score: 0.8297
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1004 score: 0.9447
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1005 score: 0.9006
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1006 score: 0.8306
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1007 score: 0.8974
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1008 score: 0.9027
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1009 score: 0.8894
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1010 score: 0.9322
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt Segment 1011 score: 0.8865
/beacon-scratch/tongzh24/XALMA-checkpoint/exp_50_languages/seperate_training/xalma-13b-sft-50-languages-pt-max-tokens-512/test-en-pt score: 0.8921