diff --git "a/results.json" "b/results.json" --- "a/results.json" +++ "b/results.json" @@ -34272,21844 +34272,33170 @@ "score":0.567169258 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.3519233265 + "score":0.342116281 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.5745897235 + "score":0.559017125 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.2759791384 + "score":0.2612038772 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.4854942304 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"af", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"af", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"af", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"af", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"af", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.4610162591 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2615212462 + "score":0.2362598693 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.4896634905 + "score":0.4567970323 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.1667049515 + "score":0.1787109448 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.4295949613 + "score":0.4308196228 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.339375511 + "score":0.2883756135 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.566407043 + "score":0.5452929372 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.2692320655 + "score":0.2563045907 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.3685144367 + "score":0.3587997566 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.3872368514 + "score":0.3529391424 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.6253206413 + "score":0.6061230642 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.3385588073 + "score":0.3735935027 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.5846751763 + "score":0.6118752881 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.3462011916 + "score":0.321926202 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5813984303 + "score":0.5672345783 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.4319399394 + "score":0.3971969927 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.6269389132 + "score":0.5997335085 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.2181205299 + "score":0.178647434 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.4844955734 + "score":0.459184816 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2033199109 + "score":0.1766325657 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.4375696019 + "score":0.42829263 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.2639599801 + "score":0.2689181562 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.4789807253 + "score":0.5103302194 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.2907084686 + "score":0.2712387895 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.4882539682 + "score":0.4721454199 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.3118761994 + "score":0.302725237 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.5439623542 + "score":0.542445303 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.243905252 + "score":0.2074435657 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.4730608179 + "score":0.4358785934 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.40510024 + "score":0.3306584572 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.6210515689 + "score":0.5470737398 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.2510210672 + "score":0.1839015438 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.4814090379 + "score":0.3995221223 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.3101513593 + "score":0.2402619776 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.5253923906 + "score":0.4816842061 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.216177525 + "score":0.2017479595 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4555999734 + "score":0.4438028104 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.2142226733 + "score":0.1964434077 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.5048792464 + "score":0.4658109118 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.3216771298 + "score":0.3578761246 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.5056511666 + "score":0.5250650323 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bho", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.3246124272 + "score":0.3118354834 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.5547058357 + "score":0.5301057957 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.2300858071 + "score":0.2712094702 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4391471287 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bm", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bm", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bm", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bm", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"bm", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.4554148161 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.3332105938 + "score":0.3106246769 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5788748413 + "score":0.5720599098 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.3925309816 + "score":0.3532786899 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.5671456285 + "score":0.5492979392 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ca", + "model":"google\/gemini-2.5-flash", + "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ca", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ca", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ca", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ca", - "task":"translation_to", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ceb", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.4667759574 + "score":0.4167458111 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.6329355142 + "score":0.6414773714 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.4086791428 + "score":0.4574369641 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.6523845508 + "score":0.6642298649 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.3593703137 + "score":0.3171272191 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.6131084436 + "score":0.5378911972 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.349617489 + "score":0.3576320675 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.5888504157 + "score":0.5996552124 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.4190817149 + "score":0.3763167038 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.633614654 + "score":0.6069984198 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.3332466044 + "score":0.412011399 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.5272130276 + "score":0.5948875971 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.4080538745 + "score":0.4097540667 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.6278026445 + "score":0.627572506 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.4940498755 + "score":0.5159030608 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.6915113583 + "score":0.6896498523 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3680077775 + "score":0.3297475202 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5798463116 + "score":0.5587828835 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.4003636095 + "score":0.3865296224 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.5747287276 + "score":0.5630460332 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.5780592594 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.727062887 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.725042796 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.868453404 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3228577771 + "score":0.3392082462 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5691176688 + "score":0.572145108 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.4211069488 + "score":0.3956672126 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6329026504 + "score":0.6257285571 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.3659700454 + "score":0.3764428485 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5807664259 + "score":0.5794911256 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.2252471667 + "score":0.3019679958 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.4480100347 + "score":0.5294391762 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fil", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.447799796 + "score":0.3967317865 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.6437494805 + "score":0.6195138455 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.318387966 + "score":0.3512547173 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.6173467767 + "score":0.6404359092 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3683003934 + "score":0.3566291662 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5961800274 + "score":0.5901709379 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5899042948 + "score":0.5810870953 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7506595836 + "score":0.7402195597 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fuv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.0858271085 + "score":0.0654195918 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.2495672773 + "score":0.2431272498 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.0320352537 + "score":0.0469027058 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.2006317654 + "score":0.2599881115 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.3793081536 + "score":0.3528703899 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5865031052 + "score":0.5605109395 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.2344717249 + "score":0.180119873 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4873543825 + "score":0.4654772276 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.3157236901 + "score":0.2852268084 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.5365403784 + "score":0.4820918601 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.3221592053 + "score":0.3191497109 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.565816945 + "score":0.5714009602 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.4661333335 + "score":0.0284513224 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6599650679 + "score":0.1002460472 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.4319599559 + "score":0.139929051 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.6493733048 + "score":0.2620347708 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.3345560794 + "score":0.336133928 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.5782385873 + "score":0.545638091 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1623642047 + "score":0.1683321583 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.4427298342 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ht", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ht", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ht", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ht", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ht", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.4261207547 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.3210417538 + "score":0.3151646581 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5852315407 + "score":0.5599039863 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.4603569586 + "score":0.4642022823 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.6610825918 + "score":0.6720003623 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"id", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3507436052 + "score":0.3580586993 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5856872774 + "score":0.5973680765 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.387557065 + "score":0.466208483 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.6730969345 + "score":0.7131031141 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.283991055 + "score":0.2779082008 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.5165825783 + "score":0.5108078595 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.297494689 + "score":0.2835120188 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.5366364022 + "score":0.5067796001 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.3679312463 + "score":0.2679844764 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.5717815434 + "score":0.5037933164 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.2293183432 + "score":0.243508886 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.5172904845 + "score":0.5329216971 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.3498261827 + "score":0.3211161163 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5707332142 + "score":0.5700208797 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.35475083 + "score":0.3654943432 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.5942822113 + "score":0.5949572053 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3590987818 + "score":0.3652971414 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5958999814 + "score":0.605823173 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.4151803591 + "score":0.3680693686 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.5319028037 + "score":0.4700002965 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3793672083 + "score":0.3627331006 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.6054760312 + "score":0.5928422481 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.3161702144 + "score":0.3781416178 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5956895972 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ki", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ki", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ki", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ki", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ki", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.6275555619 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2948023962 + "score":0.2553025069 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.5499737045 + "score":0.5408614418 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.3612978689 + "score":0.3062994849 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.6021186725 + "score":0.58504635 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3644204358 + "score":0.3700483899 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5994539632 + "score":0.6006134318 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.2065208646 + "score":0.2315452529 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.4474063783 + "score":0.4617416997 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.3051972526 + "score":0.2885658633 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5542686332 + "score":0.5512502051 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3567486129 + "score":0.3602561303 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5611431734 + "score":0.5568929694 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2872143997 + "score":0.2490831768 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.5525223441 + "score":0.5186737173 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.3116476133 + "score":0.2780296298 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.3648802199 + "score":0.3546301665 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"lua", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.1399233592 + "score":0.0591613845 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.315099285 + "score":0.2662007935 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.0802015694 + "score":0.0779434955 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.3631437635 + "score":0.3095367271 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.4128862434 + "score":0.3908377774 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.6274466843 + "score":0.6260985434 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.3688684574 + "score":0.3130016025 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5833102178 + "score":0.5391710538 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.3890840766 + "score":0.3471192 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.6240476873 + "score":0.5771683143 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2256501556 + "score":0.2207082106 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4794729055 + "score":0.4870892013 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.3701671266 + "score":0.2993063676 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5789314386 + "score":0.5474937127 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.2339248832 + "score":0.2153101678 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5444701317 + "score":0.5379094165 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.4065449181 + "score":0.3532448793 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.6069224309 + "score":0.5657281022 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.3084108149 + "score":0.2774888867 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.5610104654 + "score":0.5389145892 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2888720948 + "score":0.3233458031 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5411662197 + "score":0.5703875576 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2820351359 + "score":0.2274584553 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.5017455952 + "score":0.4665758709 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.4137133794 + "score":0.3746934831 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.6312868188 + "score":0.6046609636 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.4812654706 + "score":0.4734156929 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.7314221816 + "score":0.7284733826 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.3696810103 + "score":0.3552781219 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5941720939 + "score":0.5977013775 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.3374140159 + "score":0.3211140622 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.5598126987 + "score":0.544805929 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ne", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3690975587 + "score":0.3774439938 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.591186642 + "score":0.599804205 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2727284255 + "score":0.2861323795 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.4816401296 + "score":0.5180107937 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.3099744217 + "score":0.312116976 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5540665201 + "score":0.5463170004 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.358350435 + "score":0.3780530389 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6375438913 + "score":0.6232733213 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2769742108 + "score":0.2177968416 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.5127880962 + "score":0.4415294523 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1953053994 + "score":0.1367315108 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.5454095128 + "score":0.4585024296 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.1552982789 + "score":0.1871006972 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.4088650794 + "score":0.4365658925 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.0578542594 + "score":0.106229994 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.4227186624 + "score":0.4277182017 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.3491547876 + "score":0.3701266209 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.6003545703 + "score":0.6213278685 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.307748028 + "score":0.3031726243 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.5199829894 + "score":0.5214945108 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4833653569 + "score":0.4366998679 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6877252787 + "score":0.657751239 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4959043786 + "score":0.4527636476 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.631939007 + "score":0.6078708965 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.345076722 + "score":0.3170527901 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.5982949848 + "score":0.5593259189 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3888863333 + "score":0.381029585 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.6077722316 + "score":0.5993345379 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.4185968559 + "score":0.3912183043 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.6194298291 + "score":0.5915454866 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.5066913819 + "score":0.4626670594 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.7045563325 + "score":0.6755172019 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.3510540475 + "score":0.3285564053 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5985634799 + "score":0.5835489949 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.5670740367 + "score":0.5863602394 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.7258358589 + "score":0.7345305045 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2835606416 + "score":0.2800732142 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5525332546 + "score":0.5572474453 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.5294387768 + "score":0.4692280866 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.6814959444 + "score":0.6613842883 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.315385923 + "score":0.2768738298 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.5485214208 + "score":0.5136190092 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.3039027455 + "score":0.2743310586 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.5685019601 + "score":0.5596031593 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.4019575944 + "score":0.3271104301 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.6276858351 + "score":0.5357780664 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.3830695907 + "score":0.2320778637 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.5452929704 + "score":0.4100893183 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"si", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"si", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.3256641934 + "score":0.2632131459 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5531574071 + "score":0.4981476408 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.3465036043 + "score":0.3150668549 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.5339014715 + "score":0.466344362 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.2148918029 + "score":0.1425864886 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.4431856714 + "score":0.3921687091 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.2048159746 + "score":0.1876717865 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.5229910344 + "score":0.4923376927 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"so", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.3102660748 + "score":0.2921978364 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5202647222 + "score":0.5121729513 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.2456069778 + "score":0.2437506181 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.503324615 + "score":0.511793128 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.3298581842 + "score":0.3070769379 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5870517038 + "score":0.5829431146 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.4507987284 + "score":0.4562210568 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.6306764686 + "score":0.6349957477 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.3438400948 + "score":0.2923338131 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.5431534783 + "score":0.4917795718 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2185629205 + "score":0.2448808161 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.513335728 + "score":0.5213243396 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3332298772 + "score":0.340913979 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5774389783 + "score":0.5878242881 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.4778984127 + "score":0.4428192719 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.6958168144 + "score":0.6769035337 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.4452506057 + "score":0.3616286251 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.6299322033 + "score":0.5800788406 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4773237879 + "score":0.4820281618 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6983325706 + "score":0.7239645292 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2765535661 + "score":0.2700100505 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5553462948 + "score":0.5372825559 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.3584530222 + "score":0.30759425 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.6096517359 + "score":0.5725597295 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.4838983303 + "score":0.4465523529 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.6878651593 + "score":0.6649928543 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.4225689448 + "score":0.4129762096 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6171822766 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tg", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tg", - "task":"translation_from", - "metric":"bleu", - "score":0.2905859261 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tg", - "task":"translation_from", - "metric":"chrf", - "score":0.5219303661 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tg", - "task":"translation_to", - "metric":"bleu", - "score":0.3215838806 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"tg", - "task":"translation_to", - "metric":"chrf", - "score":0.5332721729 + "score":0.6159040363 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.363389223 + "score":0.3236889282 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5927603201 + "score":0.562821135 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.4280908922 + "score":0.4114706745 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5695430758 + "score":0.560767027 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2870643832 + "score":0.2476296934 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.5217258722 + "score":0.5033069835 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.1683718664 + "score":0.1179117378 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.2689944739 + "score":0.2587205011 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.3532965173 + "score":0.3291780472 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.6170908018 + "score":0.5900439285 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.4401941591 + "score":0.4285247051 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.6752054069 + "score":0.6508035663 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.3183568029 + "score":0.3407035036 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.569783479 + "score":0.583433778 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.4278428166 + "score":0.4167194618 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.6040719448 + "score":0.6135073244 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.037144113 + "score":0.3449466128 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.089331464 + "score":0.5552120384 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0447156552 + "score":0.3046252906 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.2228994735 + "score":0.493749829 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash", + "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash", + "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.3194163699 + "score":0.2583582755 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash", + "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5758075077 + "score":0.483302551 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash", + "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2609063103 + "score":0.3579243963 }, { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"ur", + "model":"google\/gemini-2.5-flash", + "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.4351160146 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", - "task":"translation_from", - "metric":"bleu", - "score":0.3488574237 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", - "task":"translation_from", - "metric":"chrf", - "score":0.5833892626 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", - "task":"translation_to", - "metric":"bleu", - "score":0.3525318348 - }, - { - "model":"google\/gemini-2.5-flash-preview", - "bcp_47":"uz", - "task":"translation_to", - "metric":"chrf", - "score":0.600901419 + "score":0.6083657804 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.4227968054 + "score":0.3536805169 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.6326522416 + "score":0.589790723 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.4693432911 + "score":0.4655851302 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.6659480306 + "score":0.6703129046 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.1552091518 + "score":0.0932068478 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.3984533183 + "score":0.3792197219 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0934433089 + "score":0.1171143464 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.3362523248 + "score":0.3384795969 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.3241760602 + "score":0.2793739299 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.5694459727 + "score":0.5145166794 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1373684835 + "score":0.1321430026 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.1808455778 + "score":0.176594989 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.2594184267 + "score":0.1979226992 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.4970898641 + "score":0.4588070152 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.1342973002 + "score":0.1181506898 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.4760810578 + "score":0.4718021868 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.1670055121 + "score":0.1110331374 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3949060751 + "score":0.3622261661 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1271782927 + "score":0.1764819134 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.2784136749 + "score":0.3463753843 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2666023686 + "score":0.2753706711 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5200218275 + "score":0.5198869679 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.1881613886 + "score":0.2207873686 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.2877597368 + "score":0.2915581098 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2632355471 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5527183044 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.3128970722 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.3699956681 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.3295494586 + "score":0.3429319501 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.557523684 + "score":0.5895603725 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.3146714644 + "score":0.2713803282 }, { - "model":"google\/gemini-2.5-flash-preview", + "model":"google\/gemini-2.5-flash", "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5811521396 + "score":0.5773152323 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"aeb", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.342116281 + "score":0.3214356805 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.559017125 + "score":0.5389152254 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.2612038772 + "score":0.2750202358 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.4610162591 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"af", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"af", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"af", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"af", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"af", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.4582086461 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.1 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2362598693 + "score":0.2109602349 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.4567970323 + "score":0.4227618508 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.1615485704 + "score":0.0404862392 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.4248295507 + "score":0.2400991747 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2883756135 + "score":0.2100947434 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.5452929372 + "score":0.4549390562 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.2563045907 + "score":0.2174710639 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.3587997566 + "score":0.3477622396 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"apc", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.3529391424 + "score":0.3252857092 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.6061230642 + "score":0.5932296006 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.3735935027 + "score":0.3272191754 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.6118752881 + "score":0.5729420593 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.3509446122 + "score":0.340834322 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5872861306 + "score":0.5737255077 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.4369226272 + "score":0.400951924 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.6357392299 + "score":0.6055469967 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ary", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.178647434 + "score":0.1768177745 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.459184816 + "score":0.4206182999 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.1766325657 + "score":0.1661016339 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.42829263 + "score":0.4188678128 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"arz", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.2689181562 + "score":0.2235509309 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.5103302194 + "score":0.4602443001 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.2811045733 + "score":0.2804587312 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.4796679654 + "score":0.4871597651 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.302725237 + "score":0.2397743064 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.542445303 + "score":0.4543878112 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.2074435657 + "score":0.1148483938 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.4358785934 + "score":0.3729760244 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"awa", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.3306584572 + "score":0.3589106841 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.5470737398 + "score":0.5556934974 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.1839015438 + "score":0.2194832094 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.3995221223 + "score":0.4237879497 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.2402619776 + "score":0.2436266384 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4816842061 + "score":0.4585679488 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.2017479595 + "score":0.1759303823 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4438028104 + "score":0.4132301771 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.1964434077 + "score":0.2386849466 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.4658109118 + "score":0.5137963545 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.3578761246 + "score":0.2980098252 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.5250650323 + "score":0.4897189336 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bho", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.3118354834 + "score":0.2783242324 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.5301057957 + "score":0.5195378813 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.2712094702 + "score":0.2287943315 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4554148161 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bm", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bm", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bm", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bm", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"bm", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.3991318481 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2928560114 + "score":0.3084224404 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5373877759 + "score":0.5121932853 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.371713483 + "score":0.3583142434 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.5467648432 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ca", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ca", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ca", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ca", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ca", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.4775479891 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ceb", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.4167458111 + "score":0.4286119986 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.6414773714 + "score":0.6255932052 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.4574369641 + "score":0.4113289392 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.6642298649 + "score":0.6280056275 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.3171272191 + "score":0.3024735136 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.5378911972 + "score":0.5519071111 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.3576320675 + "score":0.2912283609 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.5996552124 + "score":0.5457169481 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.3763167038 + "score":0.3674320384 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.6069984198 + "score":0.6093254166 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.412011399 + "score":0.428984445 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.5948875971 + "score":0.6342524948 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.3827187056 + "score":0.3721804398 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.6092943987 + "score":0.5986155742 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.5181328066 + "score":0.4694707802 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.6981190119 + "score":0.6759134793 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3297475202 + "score":0.3106447069 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5587828835 + "score":0.5288637721 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.3865296224 + "score":0.3186331513 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.5630460332 + "score":0.5226733847 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.5942868447 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.7298379077 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.7309888475 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.8534239972 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3497891701 + "score":0.3582552616 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5889817614 + "score":0.5871323046 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.395885417 + "score":0.3814015085 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6273835234 + "score":0.6114167807 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.3764428485 + "score":0.3270323847 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5794911256 + "score":0.5649606293 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.3019679958 + "score":0.1269608883 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.5314471888 + "score":0.3031131479 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fil", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.3970330872 + "score":0.4349803398 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.6224300541 + "score":0.6438510394 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.3731416111 + "score":0.3272281283 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.6421804886 + "score":0.6093718119 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3737227872 + "score":0.3355416948 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.6039484183 + "score":0.5838841123 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5555743798 + "score":0.584133096 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7229519037 + "score":0.7456335449 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.0654195918 + "score":0.0679142153 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.2431272498 + "score":0.2031626473 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.0469027058 + "score":0.0290719162 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.2599881115 + "score":0.1889337147 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.344471287 + "score":0.3611805314 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5591834446 + "score":0.5752776482 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.180119873 + "score":0.2391737378 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4654772276 + "score":0.4921903256 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.2852268084 + "score":0.1621381069 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4820918601 + "score":0.3417931875 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.318588004 + "score":0.2717034881 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.5675346049 + "score":0.5355442254 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.4387215588 + "score":0.204393553 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6443095169 + "score":0.2745286065 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.4255607348 + "score":0.1816643198 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.6457270128 + "score":0.2510224378 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.336133928 + "score":0.2859347325 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.545638091 + "score":0.5184335371 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1683321583 + "score":0.1342367179 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.4261207547 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ht", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ht", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ht", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ht", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ht", - "task":"translation_to", - "metric":"chrf", - "score":0.0 + "score":0.4184241385 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hu", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.3151646581 + "score":0.2730596822 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5599039863 + "score":0.5317268553 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.4642022823 + "score":0.3637494619 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.6720003623 + "score":0.6185991628 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"id", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3789722313 + "score":0.2861788949 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5973074889 + "score":0.5319409537 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.406320567 + "score":0.3948709187 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.6828299565 + "score":0.6780004275 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.2779082008 + "score":0.3188972215 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.5108078595 + "score":0.5295590822 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.2835120188 + "score":0.2811967075 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.5067796001 + "score":0.501183428 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.2679844764 + "score":0.2118796398 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.5037933164 + "score":0.4066989348 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.243508886 + "score":0.2037665999 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.5329216971 + "score":0.482790382 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.3177725576 + "score":0.2760607852 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5648818053 + "score":0.505931568 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.3654943432 + "score":0.3710768942 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.5949572053 + "score":0.6060706251 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.3423388267 + "score":0.2758724437 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5884893314 + "score":0.530496596 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3740472584 + "score":0.3593357374 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4832664839 + "score":0.4976294688 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3540174328 + "score":0.315340995 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5513315973 + "score":0.4928049131 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.329885986 + "score":0.2934453399 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5805485408 + "score":0.5856216725 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ki", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ki", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2394833815 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ki", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.5242453646 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ki", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.3207384881 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ki", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kk", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kk", - "task":"translation_from", - "metric":"bleu", - "score":0.2553025069 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kk", - "task":"translation_from", - "metric":"chrf", - "score":0.5408614418 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kk", - "task":"translation_to", - "metric":"bleu", - "score":0.3062994849 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"kk", - "task":"translation_to", - "metric":"chrf", - "score":0.58504635 + "score":0.5956517338 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"km", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3700483899 + "score":0.386478574 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.6006134318 + "score":0.6064526195 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.2315452529 + "score":0.1902174551 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.4617416997 + "score":0.4077331961 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"kn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2512885128 + "score":0.2683427219 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.4934774392 + "score":0.4680683679 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.3278617048 + "score":0.3074724881 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5102619479 + "score":0.525017962 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2465751079 + "score":0.2928122517 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.515705028 + "score":0.5280367109 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.2528779436 + "score":0.2635968583 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.3488788279 + "score":0.3368468321 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.0591613845 + "score":0.1231771445 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.2662007935 + "score":0.3217080826 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.0779434955 + "score":0.0773328896 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.3095367271 + "score":0.1832969439 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mag", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.3908377774 + "score":0.3697289109 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.6260985434 + "score":0.6084180116 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.3130016025 + "score":0.2613138272 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5391710538 + "score":0.5073964951 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mai", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.3471192 + "score":0.3625690158 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.5771683143 + "score":0.6006670528 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.2207082106 + "score":0.1897823417 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4870892013 + "score":0.4297277988 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mg", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2993063676 + "score":0.3313910493 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5474937127 + "score":0.5527395882 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.2153101678 + "score":0.1964447176 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5379094165 + "score":0.5296015703 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ml", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.3532448793 + "score":0.3414148257 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5657281022 + "score":0.5540910618 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.3046979511 + "score":0.3057528343 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.5523287159 + "score":0.5632066271 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3055522766 + "score":0.3287215168 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5435968357 + "score":0.5519425018 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.257460039 + "score":0.2304519892 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4845716024 + "score":0.4989319097 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ms", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.3746934831 + "score":0.3465169139 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.6046609636 + "score":0.5808747364 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.4734156929 + "score":0.4158487664 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.7284733826 + "score":0.6600695767 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"my", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.3552781219 + "score":0.2409863105 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.5977013775 + "score":0.5202354498 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.3211140622 + "score":0.2411557102 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.544805929 + "score":0.5039906236 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3774439938 + "score":0.3815914252 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.599804205 + "score":0.6033151685 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2861323795 + "score":0.2704724871 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.5180107937 + "score":0.5377831174 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.312116976 + "score":0.2902133526 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5463170004 + "score":0.5026903639 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3780530389 + "score":0.3708860145 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6232733213 + "score":0.6406384923 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ny", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.2177968416 + "score":0.1681187244 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.4415294523 + "score":0.4132334642 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1367315108 + "score":0.247731261 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4585024296 + "score":0.551241939 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.2 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.1871006972 + "score":0.077753472 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.4365658925 + "score":0.2855262128 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.106229994 + "score":0.0121360259 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.4277182017 + "score":0.2491350822 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.3740486194 + "score":0.3515785998 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.6141131486 + "score":0.5611231864 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.31231668 + "score":0.243065872 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.5222572922 + "score":0.4461879463 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4182659606 + "score":0.4636008739 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6696655487 + "score":0.6571795999 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4665320226 + "score":0.4815076037 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.6280330147 + "score":0.6245096256 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.3282584844 + "score":0.2488462209 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.5713765921 + "score":0.4964581993 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3762753954 + "score":0.3733344795 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.5940500139 + "score":0.5954877296 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.3485890022 + "score":0.3330604616 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.574915747 + "score":0.5424702945 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.4760104707 + "score":0.5373180666 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6891420805 + "score":0.7255352889 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.3285564053 + "score":0.3593667369 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5835489949 + "score":0.591533276 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.5863602394 + "score":0.534185929 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.7345305045 + "score":0.6955454677 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2893557086 + "score":0.2611217724 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5514512546 + "score":0.5239835944 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.4910352633 + "score":0.505609426 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.6636379715 + "score":0.6621791743 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.2768738298 + "score":0.2495091982 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.5136190092 + "score":0.5003958033 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.2743310586 + "score":0.3005818546 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.5596031593 + "score":0.5528069872 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.3296224998 + "score":0.3232854235 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.5499189472 + "score":0.5338248863 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.2231786181 + "score":0.3633825131 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.407169401 + "score":0.518082708 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"si", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2632131459 + "score":0.2404030471 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4981476408 + "score":0.4450495787 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.3150668549 + "score":0.2633769041 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.466344362 + "score":0.4000779424 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.1425864886 + "score":0.205986784 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.3921687091 + "score":0.4106144312 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.1876717865 + "score":0.1497281223 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.4923376927 + "score":0.4632023951 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.2921978364 + "score":0.1962561381 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.5121729513 + "score":0.3988286397 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.2437506181 + "score":0.1950290677 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.511793128 + "score":0.471168865 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.3070769379 + "score":0.3514693093 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5829431146 + "score":0.6142503501 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.4562210568 + "score":0.4078134146 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.6349957477 + "score":0.5830477251 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2923338131 + "score":0.302260643 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.4917795718 + "score":0.4726767086 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2448808161 + "score":0.2173421081 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.5213243396 + "score":0.5076467392 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.340913979 + "score":0.3465319309 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5878242881 + "score":0.5749229816 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.4174508433 + "score":0.427946599 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.6558948574 + "score":0.6561517251 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.397583037 + "score":0.3644616187 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.6014699575 + "score":0.5756919768 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.4540021563 + "score":0.4348964758 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.7002830052 + "score":0.6695951707 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2981018347 + "score":0.2833908051 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5573394656 + "score":0.5256006446 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.3033361537 + "score":0.295190519 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5406646936 + "score":0.5552708257 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.4025505277 + "score":0.420625812 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.6339036498 + "score":0.6022558329 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.4166086163 + "score":0.402616087 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.6171953291 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tg", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tg", - "task":"translation_from", - "metric":"bleu", - "score":0.2859260679 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tg", - "task":"translation_from", - "metric":"chrf", - "score":0.5305344486 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tg", - "task":"translation_to", - "metric":"bleu", - "score":0.3454858711 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"tg", - "task":"translation_to", - "metric":"chrf", - "score":0.5585923193 + "score":0.593002412 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"th", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.3196721957 + "score":0.2920493848 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5597673276 + "score":0.5466007251 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.4114706745 + "score":0.3859165101 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.560767027 + "score":0.5519266683 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ti", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2476296934 + "score":0.2361795584 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.5033069835 + "score":0.423037727 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.1179117378 + "score":0.1171487104 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.2587205011 + "score":0.2151258274 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"tr", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.3291780472 + "score":0.3232096665 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5900439285 + "score":0.565658608 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.4285247051 + "score":0.3961318349 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.6508035663 + "score":0.6418401217 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.3407035036 + "score":0.3098191173 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.583433778 + "score":0.5405005226 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.4167194618 + "score":0.4237145042 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.6135073244 + "score":0.5745094679 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.0287200326 + "score":0.3505799794 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"umb", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.1566177223 + "score":0.5928594723 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"umb", - "task":"translation_to", - "metric":"bleu", - "score":0.0503465615 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"umb", - "task":"translation_to", - "metric":"chrf", - "score":0.21805483 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"translation_from", - "metric":"bleu", - "score":0.3212777323 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", - "bcp_47":"ur", - "task":"translation_from", - "metric":"chrf", - "score":0.5735084601 - }, - { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.3027958989 + "score":0.3049544641 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.4912965943 + "score":0.4891357222 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2583582755 + "score":0.3150100377 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.483302551 + "score":0.5577978212 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.3579243963 + "score":0.3047703558 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.6083657804 + "score":0.5585171573 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"vi", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.3471784526 + "score":0.3426773013 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.5719753053 + "score":0.5563179871 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.4601231177 + "score":0.435916799 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.6644848789 + "score":0.6514701627 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.1 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.2 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.0932068478 + "score":0.1075258999 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.3792197219 + "score":0.3177870837 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.1171143464 + "score":0.0558894656 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.3384795969 + "score":0.1904131636 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wuu", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.2968992777 + "score":0.2535066622 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.5258850631 + "score":0.4977368741 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1321430026 + "score":0.1296483018 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.176594989 + "score":0.1831676522 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.1979226992 + "score":0.260645909 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.4588070152 + "score":0.4857479623 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.1181506898 + "score":0.0868490585 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.4718021868 + "score":0.4297420084 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.1110331374 + "score":0.1383444474 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3622261661 + "score":0.363924587 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1764819134 + "score":0.1077842587 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.3463753843 + "score":0.2964363774 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2756047962 + "score":0.2602982164 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.518253876 + "score":0.5072059049 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.2356751392 + "score":0.2013964224 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.3051882861 + "score":0.2554887406 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2989639846 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5646599732 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.2915310914 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.3358004159 + "score":0.0 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.3429319501 + "score":0.2804680604 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.5895603725 + "score":0.5519773239 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.2713803282 + "score":0.250972384 }, { - "model":"google\/gemini-2.5-flash-preview-05-20", + "model":"google\/gemini-2.5-flash-lite-preview-06-17", "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.5773152323 + "score":0.5466457559 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.0278093886 + "score":0.3519233265 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.1209403877 + "score":0.5745897235 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.0460469917 + "score":0.2759791384 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.1583874959 + "score":0.4854942304 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"af", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"af", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"af", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"af", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"af", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.4 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.0746358572 + "score":0.2615212462 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.2039454163 + "score":0.4896634905 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.0106555853 + "score":0.1667049515 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.1635891431 + "score":0.4295949613 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.0987853648 + "score":0.339375511 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.2172965208 + "score":0.566407043 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.0037326563 + "score":0.2692320655 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.0273289802 + "score":0.3685144367 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.0349474752 + "score":0.3872368514 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.205929391 + "score":0.6253206413 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.0109943205 + "score":0.3385588073 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.1135056868 + "score":0.5846751763 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.0231513455 + "score":0.3462011916 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.1669816885 + "score":0.5813984303 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.0192052173 + "score":0.4319399394 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.1199941852 + "score":0.6269389132 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.0482644911 + "score":0.2181205299 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.1570610957 + "score":0.4844955734 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.2033199109 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.0671140896 + "score":0.4375696019 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.0333540125 + "score":0.2639599801 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.1654807425 + "score":0.4789807253 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.0300458941 + "score":0.2907084686 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.1417391491 + "score":0.4882539682 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"as", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.0153668157 + "score":0.3118761994 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.1119995149 + "score":0.5439623542 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.0988733729 + "score":0.243905252 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.2096173766 + "score":0.4730608179 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.0696643378 + "score":0.40510024 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.1931858455 + "score":0.6210515689 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.0309816185 + "score":0.2510210672 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.1018697927 + "score":0.4814090379 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"az", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.0634083235 + "score":0.3101513593 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.1819427877 + "score":0.5253923906 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.0728528728 + "score":0.216177525 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.2068099712 + "score":0.4555999734 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"be", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.0726648889 + "score":0.2142226733 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.2430791182 + "score":0.5048792464 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.0528414924 + "score":0.3216771298 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.1724803068 + "score":0.5056511666 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.1903946317 + "score":0.3246124272 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.3145924631 + "score":0.5547058357 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.2300858071 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.0310651444 + "score":0.4391471287 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bm", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bm", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bm", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bm", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bm", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0425897525 + "score":0.3332105938 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.1329517484 + "score":0.5788748413 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1071842556 + "score":0.3925309816 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.2292182808 + "score":0.5671456285 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ca", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ca", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ca", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ca", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ca", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.1295041316 + "score":0.4667759574 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.2647572228 + "score":0.6329355142 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.0551171959 + "score":0.4086791428 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.2019792449 + "score":0.6523845508 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ckb", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.1181725504 + "score":0.3593703137 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.3417239653 + "score":0.6131084436 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.0030057917 + "score":0.349617489 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.050016858 + "score":0.5888504157 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.1106488773 + "score":0.4190817149 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.2661126449 + "score":0.633614654 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.0566112691 + "score":0.3332466044 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.2161355093 + "score":0.5272130276 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1071586446 + "score":0.4080538745 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.2867516145 + "score":0.6278026445 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.1380160311 + "score":0.4940498755 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.3472666619 + "score":0.6915113583 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.1228102479 + "score":0.3680077775 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.257059719 + "score":0.5798463116 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.0709906394 + "score":0.4003636095 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.1615768924 + "score":0.5747287276 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3271580119 + "score":0.5780592594 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.4059591673 + "score":0.727062887 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.4705724484 + "score":0.725042796 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.5810510479 + "score":0.868453404 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.0612440394 + "score":0.3228577771 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.214820597 + "score":0.5691176688 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.0718408174 + "score":0.4211069488 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.2974455623 + "score":0.6329026504 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.1093307519 + "score":0.3659700454 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.2212819207 + "score":0.5807664259 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.0461058798 + "score":0.2252471667 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.1370841628 + "score":0.4480100347 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fil", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.1005924157 + "score":0.447799796 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.202708484 + "score":0.6437494805 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.0160833262 + "score":0.318387966 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.1960110619 + "score":0.6173467767 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1269813968 + "score":0.3683003934 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.3065913664 + "score":0.5961800274 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.1789987295 + "score":0.5899042948 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.3463028707 + "score":0.7506595836 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.014745965 + "score":0.0858271085 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.0749091363 + "score":0.2495672773 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.0320352537 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.0895914252 + "score":0.2006317654 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"gu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.097971755 + "score":0.3793081536 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.1777195033 + "score":0.5865031052 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.0318870555 + "score":0.2344717249 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.1529629731 + "score":0.4873543825 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.5 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.0369448389 + "score":0.3157236901 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.1480560277 + "score":0.5365403784 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.0919802251 + "score":0.3221592053 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.2629251679 + "score":0.565816945 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.2538230452 + "score":0.4661333335 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.3759994265 + "score":0.6599650679 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.0835774684 + "score":0.4319599559 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.1904298158 + "score":0.6493733048 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.0800273183 + "score":0.3345560794 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.2260677118 + "score":0.5782385873 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.0220446366 + "score":0.1623642047 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.0997285023 + "score":0.4427298342 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ht", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ht", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ht", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ht", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ht", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.0883989834 + "score":0.3210417538 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.206785454 + "score":0.5852315407 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.0790692679 + "score":0.4603569586 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.28304649 + "score":0.6610825918 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.0773479102 + "score":0.3507436052 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.2587381281 + "score":0.5856872774 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.0433423647 + "score":0.387557065 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.2817069358 + "score":0.6730969345 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.0612163002 + "score":0.283991055 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.2381342912 + "score":0.5165825783 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.0426402139 + "score":0.297494689 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.1696737174 + "score":0.5366364022 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ilo", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.0970247032 + "score":0.3679312463 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.2111718332 + "score":0.5717815434 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.0050070462 + "score":0.2293183432 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.1683969558 + "score":0.5172904845 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.139001615 + "score":0.3498261827 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.2668336456 + "score":0.5707332142 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.0475935646 + "score":0.35475083 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.2602541027 + "score":0.5942822113 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.0609909305 + "score":0.3590987818 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.1860226608 + "score":0.5958999814 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.0692256682 + "score":0.4151803591 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.1449932716 + "score":0.5319028037 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.0495085803 + "score":0.3793672083 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.1459303026 + "score":0.6054760312 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.0098682093 + "score":0.3161702144 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.1292642853 + "score":0.5956895972 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ki", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ki", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ki", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ki", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ki", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kk", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.0827091376 + "score":0.2948023962 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.2337306985 + "score":0.5499737045 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.0492400989 + "score":0.3612978689 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.155912411 + "score":0.6021186725 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.0860125484 + "score":0.3644204358 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.1623830923 + "score":0.5994539632 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.0024514101 + "score":0.2065208646 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.0781695805 + "score":0.4474063783 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.0937784828 + "score":0.3051972526 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.2195953032 + "score":0.5542686332 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.0577688436 + "score":0.3567486129 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.1510063998 + "score":0.5611431734 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.0680252346 + "score":0.2872143997 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.2091636742 + "score":0.5525223441 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.0555477009 + "score":0.3116476133 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.0549298013 + "score":0.3648802199 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.0036630043 + "score":0.1399233592 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.099240382 + "score":0.315099285 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.0532977337 + "score":0.0802015694 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.2153600503 + "score":0.3631437635 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.1425685645 + "score":0.4128862434 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.3016796517 + "score":0.6274466843 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.0118929014 + "score":0.3688684574 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.0840825564 + "score":0.5833102178 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.115229855 + "score":0.3890840766 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.2180450998 + "score":0.6240476873 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.0163179059 + "score":0.2256501556 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.0417840087 + "score":0.4794729055 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.0410364581 + "score":0.3701671266 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.2193286405 + "score":0.5789314386 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.0422799242 + "score":0.2339248832 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.1425526516 + "score":0.5444701317 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ml", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.0630918824 + "score":0.4065449181 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.1710971727 + "score":0.6069224309 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.0386225926 + "score":0.3084108149 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.1445595523 + "score":0.5610104654 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.1084731704 + "score":0.2888720948 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.2498733805 + "score":0.5411662197 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.2820351359 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.0399406962 + "score":0.5017455952 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.033427329 + "score":0.4137133794 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.1616696801 + "score":0.6312868188 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.115786224 + "score":0.4812654706 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.3018549986 + "score":0.7314221816 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2294643956 + "score":0.3696810103 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.3457333311 + "score":0.5941720939 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.1065767565 + "score":0.3374140159 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.2047469752 + "score":0.5598126987 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.0951128399 + "score":0.3690975587 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.2178534884 + "score":0.591186642 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.0398161454 + "score":0.2727284255 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.1412294262 + "score":0.4816401296 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.0563796721 + "score":0.3099744217 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.1918127836 + "score":0.5540665201 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.0887408505 + "score":0.358350435 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.3444852597 + "score":0.6375438913 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.0322569074 + "score":0.2769742108 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.1681655692 + "score":0.5127880962 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.0133097605 + "score":0.1953053994 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.1890356187 + "score":0.5454095128 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.4 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.0380467697 + "score":0.1552982789 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.11665963 + "score":0.4088650794 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.0196821089 + "score":0.0578542594 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.1887330103 + "score":0.4227186624 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.0987048471 + "score":0.3491547876 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.2474195062 + "score":0.6003545703 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.0246921682 + "score":0.307748028 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.1089265139 + "score":0.5199829894 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2220426626 + "score":0.4833653569 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.3598952341 + "score":0.6877252787 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.1611882376 + "score":0.4959043786 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.2396561128 + "score":0.631939007 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.0904332342 + "score":0.345076722 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.2068730334 + "score":0.5982949848 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.046065351 + "score":0.3888863333 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.1925827805 + "score":0.6077722316 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.1079576302 + "score":0.4185968559 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.2645017017 + "score":0.6194298291 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.0569295003 + "score":0.5066913819 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.2615431845 + "score":0.7045563325 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.131593328 + "score":0.3510540475 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.3060223321 + "score":0.5985634799 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.0757294413 + "score":0.5670740367 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.2150897212 + "score":0.7258358589 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.3 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.0926690761 + "score":0.2835606416 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.2397253952 + "score":0.5525332546 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1044259789 + "score":0.5294387768 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.236302624 + "score":0.6814959444 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.5 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.0153852885 + "score":0.315385923 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.1605190155 + "score":0.5485214208 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.0600552316 + "score":0.3039027455 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.2182309051 + "score":0.5685019601 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.120327349 + "score":0.4019575944 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.2042820289 + "score":0.6276858351 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.0309396387 + "score":0.3830695907 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.1043645846 + "score":0.5452929704 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.0861987344 + "score":0.3256641934 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.2079338406 + "score":0.5531574071 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.0196434254 + "score":0.3465036043 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.0610643505 + "score":0.5339014715 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.0320247445 + "score":0.2148918029 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.2176774161 + "score":0.4431856714 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.0700005142 + "score":0.2048159746 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.1952413901 + "score":0.5229910344 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"so", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.0252575003 + "score":0.3102660748 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.157057904 + "score":0.5202647222 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.0629444831 + "score":0.2456069778 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.1833979697 + "score":0.503324615 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.0868186974 + "score":0.3298581842 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.2586575848 + "score":0.5870517038 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.1093378877 + "score":0.4507987284 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.2502315423 + "score":0.6306764686 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.0782352762 + "score":0.3438400948 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.2378174872 + "score":0.5431534783 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.0338179306 + "score":0.2185629205 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.2284098709 + "score":0.513335728 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.1179976804 + "score":0.3332298772 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.2633320797 + "score":0.5774389783 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.0494945427 + "score":0.4778984127 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.2411403917 + "score":0.6958168144 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.1282740208 + "score":0.4452506057 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.2521886667 + "score":0.6299322033 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.0748708455 + "score":0.4773237879 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.2420611826 + "score":0.6983325706 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.1073230839 + "score":0.2765535661 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.1798254279 + "score":0.5553462948 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.0317538654 + "score":0.3584530222 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.2038003362 + "score":0.6096517359 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.1951561832 + "score":0.4838983303 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.3697480899 + "score":0.6878651593 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.1899598166 + "score":0.4225689448 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.2894416622 + "score":0.6171822766 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tg", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.0653258846 + "score":0.2905859261 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.2205970586 + "score":0.5219303661 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.0222271283 + "score":0.3215838806 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.120000505 + "score":0.5332721729 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"th", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.1262768628 + "score":0.363389223 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.2570885899 + "score":0.5927603201 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.0575688551 + "score":0.4280908922 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.1582234491 + "score":0.5695430758 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ti", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2870643832 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.062613791 + "score":0.5217258722 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.0059519046 + "score":0.1683718664 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.0274291267 + "score":0.2689944739 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.0337787053 + "score":0.3532965173 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.1824544035 + "score":0.6170908018 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.1405643754 + "score":0.4401941591 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.281387297 + "score":0.6752054069 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.1091041441 + "score":0.3183568029 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.2184696361 + "score":0.569783479 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.1508474535 + "score":0.4278428166 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.234056096 + "score":0.6040719448 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.8 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.0058005929 + "score":0.037144113 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.0841095708 + "score":0.089331464 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.0447156552 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.1328221884 + "score":0.2228994735 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.1386027419 + "score":0.3194163699 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.3084595255 + "score":0.5758075077 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.0167447692 + "score":0.2609063103 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.0960347815 + "score":0.4351160146 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.0342337572 + "score":0.3488574237 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.1153353221 + "score":0.5833892626 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.0694684605 + "score":0.3525318348 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.2369528571 + "score":0.600901419 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.1615259525 + "score":0.4227968054 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.2808117936 + "score":0.6326522416 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.1251511875 + "score":0.4693432911 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.3058766946 + "score":0.6659480306 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.3 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.5 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.0065958006 + "score":0.1552091518 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.0642484091 + "score":0.3984533183 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0043862302 + "score":0.0934433089 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.1616631945 + "score":0.3362523248 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.0666328001 + "score":0.3241760602 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.2282939681 + "score":0.5694459727 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.0063550665 + "score":0.1373684835 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.0402314549 + "score":0.1808455778 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.0731036446 + "score":0.2594184267 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.1810894045 + "score":0.4970898641 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.0117190064 + "score":0.1342973002 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.1631103727 + "score":0.4760810578 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.7 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.058648798 + "score":0.1670055121 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.162917811 + "score":0.3949060751 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.0647492243 + "score":0.1271782927 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.1522863767 + "score":0.2784136749 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.1133445002 + "score":0.2666023686 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.2630654346 + "score":0.5200218275 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.0177899901 + "score":0.1881613886 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.0452074918 + "score":0.2877597368 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.0949407188 + "score":0.2632355471 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.2042376654 + "score":0.5527183044 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.3128970722 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.0169223477 + "score":0.3699956681 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.6 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.0 + "score":0.9 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.0689235431 + "score":0.3295494586 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.2000811037 + "score":0.557523684 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.0413489342 + "score":0.3146714644 }, { - "model":"google\/gemini-2.5-pro-preview-05-06", + "model":"google\/gemini-2.5-flash-preview", "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.1904482997 + "score":0.5811521396 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"aeb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.2073802913 + "score":0.342116281 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.4889223975 + "score":0.559017125 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.0840656979 + "score":0.2612038772 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.3453561943 + "score":0.4610162591 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"af", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"af", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"af", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"af", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"af", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.120094546 + "score":0.2362598693 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.3259782194 + "score":0.4567970323 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.0974181135 + "score":0.1615485704 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.3477814679 + "score":0.4248295507 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.2393172056 + "score":0.2883756135 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.4971254293 + "score":0.5452929372 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.2089212841 + "score":0.2563045907 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.3406916002 + "score":0.3587997566 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"apc", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.2712045148 + "score":0.3529391424 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.5477096036 + "score":0.6061230642 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.178052271 + "score":0.3735935027 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.468064885 + "score":0.6118752881 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ar", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ar", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2747843596 + "score":0.3509446122 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.5519960681 + "score":0.5872861306 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.2863967069 + "score":0.4369226272 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.5318173199 + "score":0.6357392299 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ary", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.1096694862 + "score":0.178647434 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.4291604898 + "score":0.459184816 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.1630720543 + "score":0.1766325657 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.3952400339 + "score":0.42829263 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"arz", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.1892846534 + "score":0.2689181562 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.4212342522 + "score":0.5103302194 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.1938470016 + "score":0.2811045733 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.4527968539 + "score":0.4796679654 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"as", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.2094379574 + "score":0.302725237 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.4509809217 + "score":0.542445303 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.1931386564 + "score":0.2074435657 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.4233010233 + "score":0.4358785934 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"awa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.2957522582 + "score":0.3306584572 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.5232039352 + "score":0.5470737398 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.2308361669 + "score":0.1839015438 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.4087255612 + "score":0.3995221223 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"az", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.200456445 + "score":0.2402619776 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.4226152307 + "score":0.4816842061 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.1414132922 + "score":0.2017479595 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.4170843853 + "score":0.4438028104 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"be", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"be", "task":"translation_from", "metric":"bleu", - "score":0.18522743 + "score":0.1964434077 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"be", "task":"translation_from", "metric":"chrf", - "score":0.4467570037 + "score":0.4658109118 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"be", "task":"translation_to", "metric":"bleu", - "score":0.2590661095 + "score":0.3578761246 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"be", "task":"translation_to", "metric":"chrf", - "score":0.4657468506 + "score":0.5250650323 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bho", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.2663307677 + "score":0.3118354834 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.519985227 + "score":0.5301057957 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.1913577407 + "score":0.2712094702 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.4064669591 + "score":0.4554148161 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bm", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bm", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bm", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bm", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bm", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.271237739 + "score":0.2928560114 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5173954387 + "score":0.5373877759 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.3067537945 + "score":0.371713483 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.5194482945 + "score":0.5467648432 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ca", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ca", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ca", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ca", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ca", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ceb", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.3694979709 + "score":0.4167458111 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.59081536 + "score":0.6414773714 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.374702944 + "score":0.4574369641 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.6019503341 + "score":0.6642298649 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ckb", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.2792699678 + "score":0.3171272191 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.5157552806 + "score":0.5378911972 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.2334415639 + "score":0.3576320675 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.5128705295 + "score":0.5996552124 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.3536861453 + "score":0.3763167038 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.6024608455 + "score":0.6069984198 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.4031829559 + "score":0.412011399 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.6234553711 + "score":0.5948875971 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.3189602129 + "score":0.3827187056 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5548503533 + "score":0.6092943987 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.5229096392 + "score":0.5181328066 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.7023434262 + "score":0.6981190119 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.3137252517 + "score":0.3297475202 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5147981205 + "score":0.5587828835 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.3302929673 + "score":0.3865296224 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.505425141 + "score":0.5630460332 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3889146477 + "score":0.5942868447 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.628092835 + "score":0.7298379077 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.4660772497 + "score":0.7309888475 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.7280386297 + "score":0.8534239972 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3593767686 + "score":0.3497891701 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5668073679 + "score":0.5889817614 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3662275621 + "score":0.395885417 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6102640711 + "score":0.6273835234 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.286051969 + "score":0.3764428485 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5373856549 + "score":0.5794911256 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.1816947237 + "score":0.3019679958 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.3981159206 + "score":0.5314471888 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fil", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fil", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.3579818144 + "score":0.3970330872 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.5889481625 + "score":0.6224300541 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.3403832088 + "score":0.3731416111 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.590264879 + "score":0.6421804886 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.3180384008 + "score":0.3737227872 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5571267732 + "score":0.6039484183 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5778354146 + "score":0.5555743798 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7490356238 + "score":0.7229519037 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fuv", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.0380719948 + "score":0.0654195918 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.2066039108 + "score":0.2431272498 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.0259757351 + "score":0.0469027058 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.147148937 + "score":0.2599881115 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"gu", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.34811918 + "score":0.344471287 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5482709715 + "score":0.5591834446 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.1618983325 + "score":0.180119873 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4411905252 + "score":0.4654772276 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"mgsm", "metric":"accuracy", "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1925315551 + "score":0.2852268084 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.4032389241 + "score":0.4820918601 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.1992720083 + "score":0.318588004 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4905441802 + "score":0.5675346049 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":1.0 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3722751955 + "score":0.4387215588 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6207213131 + "score":0.6443095169 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3378499277 + "score":0.4255607348 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.554090013 + "score":0.6457270128 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hne", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hne", "task":"translation_from", "metric":"bleu", - "score":0.2879989689 + "score":0.336133928 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hne", "task":"translation_from", "metric":"chrf", - "score":0.5083598943 + "score":0.545638091 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hne", "task":"translation_to", "metric":"bleu", - "score":0.1719225434 + "score":0.1683321583 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hne", "task":"translation_to", "metric":"chrf", - "score":0.3992950999 + "score":0.4261207547 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ht", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ht", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ht", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ht", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ht", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hu", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hu", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.3234067809 + "score":0.3151646581 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5706707095 + "score":0.5599039863 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3187264685 + "score":0.4642022823 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.5856828402 + "score":0.6720003623 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"id", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3583744222 + "score":0.3789722313 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5732194975 + "score":0.5973074889 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.3364664006 + "score":0.406320567 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.6438910651 + "score":0.6828299565 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.225000401 + "score":0.2779082008 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.4567066441 + "score":0.5108078595 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1941055199 + "score":0.2835120188 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.4504811493 + "score":0.5067796001 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ilo", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.1944477164 + "score":0.2679844764 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.4517028309 + "score":0.5037933164 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.2035517344 + "score":0.243508886 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.489419705 + "score":0.5329216971 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.3074361781 + "score":0.3177725576 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5178180754 + "score":0.5648818053 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.3505959215 + "score":0.3654943432 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.5955060476 + "score":0.5949572053 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2581140706 + "score":0.3423388267 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5395853617 + "score":0.5884893314 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.3298839393 + "score":0.3740472584 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4471547552 + "score":0.4832664839 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"jv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3177915441 + "score":0.3540174328 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5387853038 + "score":0.5513315973 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2549228547 + "score":0.329885986 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5322440265 + "score":0.5805485408 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ki", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ki", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ki", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ki", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ki", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.1983700044 + "score":0.2553025069 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.4843458319 + "score":0.5408614418 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2920207746 + "score":0.3062994849 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.5345155349 + "score":0.58504635 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"km", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3702042307 + "score":0.3700483899 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5776853975 + "score":0.6006134318 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.1498433716 + "score":0.2315452529 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.3652702605 + "score":0.4617416997 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kn", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2858443353 + "score":0.2512885128 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5499221943 + "score":0.4934774392 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.2481102245 + "score":0.3278617048 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.4829685786 + "score":0.5102619479 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ko", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2305492704 + "score":0.2465751079 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.4826740501 + "score":0.515705028 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.1746024172 + "score":0.2528779436 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.3073554703 + "score":0.3488788279 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"lua", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.0913600379 + "score":0.0591613845 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.3305636235 + "score":0.2662007935 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.0269728382 + "score":0.0779434955 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.3155017027 + "score":0.3095367271 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mag", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.3751831337 + "score":0.3908377774 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.6085851316 + "score":0.6260985434 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mag", "task":"translation_to", "metric":"bleu", - "score":0.259988405 + "score":0.3130016025 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mag", "task":"translation_to", "metric":"chrf", - "score":0.5046714005 + "score":0.5391710538 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mai", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.306099972 + "score":0.3471192 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.5370842801 + "score":0.5771683143 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.1736022871 + "score":0.2207082106 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4305653856 + "score":0.4870892013 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mg", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mg", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2826629018 + "score":0.2993063676 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5215979873 + "score":0.5474937127 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.238462643 + "score":0.2153101678 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.5334745774 + "score":0.5379094165 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ml", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.3161992509 + "score":0.3532448793 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5479755911 + "score":0.5657281022 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2133071404 + "score":0.3046979511 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4660281027 + "score":0.5523287159 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.2370074805 + "score":0.3055522766 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4804215458 + "score":0.5435968357 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2399769139 + "score":0.257460039 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4726429935 + "score":0.4845716024 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ms", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ms", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.3104483533 + "score":0.3746934831 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.5705763492 + "score":0.6046609636 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.4229626959 + "score":0.4734156929 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.6856510383 + "score":0.7284733826 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"my", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.2227645269 + "score":0.3552781219 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.4888582617 + "score":0.5977013775 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.1869632744 + "score":0.3211140622 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.4322398057 + "score":0.544805929 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3115387303 + "score":0.3774439938 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5342290246 + "score":0.599804205 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.22081567 + "score":0.2861323795 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.4878836055 + "score":0.5180107937 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.3125704924 + "score":0.312116976 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5397676594 + "score":0.5463170004 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3586968371 + "score":0.3780530389 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6075205554 + "score":0.6232733213 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.1901221224 + "score":0.2177968416 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.438728736 + "score":0.4415294523 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1330024304 + "score":0.1367315108 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4711022084 + "score":0.4585024296 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.0258426139 + "score":0.1871006972 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.2237241232 + "score":0.4365658925 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.0460531144 + "score":0.106229994 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.3418147419 + "score":0.4277182017 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"or", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.3714452662 + "score":0.3740486194 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5977153904 + "score":0.6141131486 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.2234825764 + "score":0.31231668 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.4562477173 + "score":0.5222572922 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.4180718844 + "score":0.4182659606 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6426219278 + "score":0.6696655487 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.3938693136 + "score":0.4665320226 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.5573992167 + "score":0.6280330147 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2456102401 + "score":0.3282584844 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.5190609119 + "score":0.5713765921 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.4265619216 + "score":0.3762753954 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.6320824157 + "score":0.5940500139 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.3537745123 + "score":0.3485890022 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5904429929 + "score":0.574915747 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.4588664196 + "score":0.4760104707 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6844540285 + "score":0.6891420805 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.3139442337 + "score":0.3285564053 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5741447282 + "score":0.5835489949 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.5016049999 + "score":0.5863602394 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.6788048008 + "score":0.7345305045 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2449777422 + "score":0.2893557086 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5268764903 + "score":0.5514512546 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3789708434 + "score":0.4910352633 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.5790333031 + "score":0.6636379715 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", "score":0.3 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.1839360587 + "score":0.2768738298 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.448997409 + "score":0.5136190092 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.1891835724 + "score":0.2743310586 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.508623725 + "score":0.5596031593 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sd", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.3352727297 + "score":0.3296224998 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.5583215205 + "score":0.5499189472 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.2009000601 + "score":0.2231786181 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.4004383195 + "score":0.407169401 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"si", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"si", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.2297304995 + "score":0.2632131459 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.5040607132 + "score":0.4981476408 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2136543311 + "score":0.3150668549 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.3916393466 + "score":0.466344362 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.1221415503 + "score":0.1425864886 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.3516954503 + "score":0.3921687091 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.108688779 + "score":0.1876717865 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.4515663403 + "score":0.4923376927 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"so", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.2308889646 + "score":0.2921978364 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.4618048204 + "score":0.5121729513 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.1667302795 + "score":0.2437506181 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.4717296026 + "score":0.511793128 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.2351861569 + "score":0.3070769379 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5329036218 + "score":0.5829431146 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.4168384094 + "score":0.4562210568 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.6032787874 + "score":0.6349957477 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.2291561983 + "score":0.2923338131 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.4673987803 + "score":0.4917795718 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.2036733766 + "score":0.2448808161 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.5047620958 + "score":0.5213243396 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3500384253 + "score":0.340913979 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5797456052 + "score":0.5878242881 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.4268868445 + "score":0.4174508433 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.664863412 + "score":0.6558948574 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.3005035588 + "score":0.397583037 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5210660172 + "score":0.6014699575 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.3401968092 + "score":0.4540021563 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6217197146 + "score":0.7002830052 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ta", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2662307086 + "score":0.2981018347 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5053585639 + "score":0.5573394656 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.3044345778 + "score":0.3033361537 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5714036731 + "score":0.5406646936 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3330093484 + "score":0.4025505277 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5694168709 + "score":0.6339036498 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.257812168 + "score":0.4166086163 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.5167002436 + "score":0.6171953291 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tg", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.2176170344 + "score":0.2859260679 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.4496406258 + "score":0.5305344486 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.2605536967 + "score":0.3454858711 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.4816066849 + "score":0.5585923193 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"th", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2992360169 + "score":0.3196721957 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5585599708 + "score":0.5597673276 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.4269079012 + "score":0.4114706745 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5719718715 + "score":0.560767027 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ti", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.2042995208 + "score":0.2476296934 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.416626147 + "score":0.5033069835 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.0833250166 + "score":0.1179117378 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.1982489294 + "score":0.2587205011 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2832304201 + "score":0.3291780472 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5467240003 + "score":0.5900439285 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.3273464288 + "score":0.4285247051 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.5827048506 + "score":0.6508035663 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uk", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2813742416 + "score":0.3407035036 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.5413704266 + "score":0.583433778 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.4063054094 + "score":0.4167194618 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.6020718231 + "score":0.6135073244 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"umb", "task":"classification", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.0495917134 + "score":0.0287200326 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.1711087397 + "score":0.1566177223 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.0358872001 + "score":0.0503465615 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.2761667256 + "score":0.21805483 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.322448107 + "score":0.3212777323 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5887654616 + "score":0.5735084601 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.2148139783 + "score":0.3027958989 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.4226865444 + "score":0.4912965943 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2829644119 + "score":0.2583582755 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5194956482 + "score":0.483302551 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2911955464 + "score":0.3579243963 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.5560139888 + "score":0.6083657804 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2745000434 + "score":0.3471784526 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.5206422805 + "score":0.5719753053 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.4261790941 + "score":0.4601231177 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.6358462464 + "score":0.6644848789 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.0 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.2 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.0696458062 + "score":0.0932068478 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.2461140434 + "score":0.3792197219 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0728989985 + "score":0.1171143464 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.2267265908 + "score":0.3384795969 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.2072386748 + "score":0.2968992777 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.4628288648 + "score":0.5258850631 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1471425714 + "score":0.1321430026 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.1971299212 + "score":0.176594989 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.253783308 + "score":0.1979226992 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.4487387303 + "score":0.4588070152 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.0662544821 + "score":0.1181506898 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3784904721 + "score":0.4718021868 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.0887390501 + "score":0.1110331374 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.3201148841 + "score":0.3622261661 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1178050815 + "score":0.1764819134 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.307433063 + "score":0.3463753843 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yue", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2253512269 + "score":0.2756047962 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.4949150094 + "score":0.518253876 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.1897306863 + "score":0.2356751392 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.2561574259 + "score":0.3051882861 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.2201641871 + "score":0.2989639846 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.5051068628 + "score":0.5646599732 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.2508351517 + "score":0.2915310914 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.3110461024 + "score":0.3358004159 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.252616884 + "score":0.3429319501 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4822778382 + "score":0.5895603725 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.1940901676 + "score":0.2713803282 }, { - "model":"google\/gemini-flash-1.5", + "model":"google\/gemini-2.5-flash-preview-05-20", "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.4661416094 + "score":0.5773152323 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"aeb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"aeb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2041309024 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"aeb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4630820951 + "score":0.0119333611 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"aeb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.1453469275 + "score":0.0433795513 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"aeb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.3874336138 + "score":0.086624937 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"af", + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"af", + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.1420800017 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"af", + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.2571278005 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"af", + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.0740143168 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"af", + "model":"google\/gemini-2.5-pro", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.0900638149 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1059711376 + "score":0.075270263 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.300568481 + "score":0.1801898422 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.0110669593 + "score":0.079678832 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ak", + "model":"google\/gemini-2.5-pro", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.2141540563 + "score":0.1387482052 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.1906134629 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.4467868389 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.2001643223 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"am", + "model":"google\/gemini-2.5-pro", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.3225170104 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.1876459632 + "score":0.0322638642 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.4830875841 + "score":0.1070675634 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.1830944017 + "score":0.1132855578 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"apc", + "model":"google\/gemini-2.5-pro", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.4175337587 + "score":0.2363989029 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fa", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.260683336 + "score":0.0628255969 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5383651277 + "score":0.1404540616 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.2962406565 + "score":0.0929691836 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ar", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.5190026627 + "score":0.1936176153 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ary", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ary", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.1438491224 + "score":0.1363784433 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ary", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.418499848 + "score":0.2546980579 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ary", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.1044262978 + "score":0.2831711013 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ary", + "model":"google\/gemini-2.5-pro", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.3577242047 + "score":0.423402744 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"google\/gemini-2.5-pro", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"google\/gemini-2.5-pro", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.1675595946 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"google\/gemini-2.5-pro", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.4187188467 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"google\/gemini-2.5-pro", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1545869288 + "score":0.046932578 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"arz", + "model":"google\/gemini-2.5-pro", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.4031218248 + "score":0.1114891082 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"as", + "model":"google\/gemini-2.5-pro", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"as", + "model":"google\/gemini-2.5-pro", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.1892328534 + "score":0.0849232664 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"as", + "model":"google\/gemini-2.5-pro", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4434206925 + "score":0.1180502872 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"as", + "model":"google\/gemini-2.5-pro", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.1070430926 + "score":0.16572501 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"as", + "model":"google\/gemini-2.5-pro", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.3318636339 + "score":0.2936653353 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"awa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"awa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.3180630074 + "score":0.0353192374 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"awa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5401606876 + "score":0.0912070168 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"awa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.1993490206 + "score":0.0843198982 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"awa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.4215901923 + "score":0.1834427215 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.1604267099 + "score":0.1728301922 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.4139767864 + "score":0.2722873664 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.1651025864 + "score":0.0452386704 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"az", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.3978212407 + "score":0.0759200811 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"be", + "model":"google\/gemini-2.5-pro", + "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"be", + "model":"google\/gemini-2.5-pro", + "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.19213953 + "score":0.1519234884 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"be", + "model":"google\/gemini-2.5-pro", + "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4512512424 + "score":0.2526899598 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"be", + "model":"google\/gemini-2.5-pro", + "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2406657525 + "score":0.0370612896 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"be", + "model":"google\/gemini-2.5-pro", + "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.4536513075 + "score":0.1525405786 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2519150677 + "score":0.0673608539 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.4966963131 + "score":0.1795707438 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.2057435019 + "score":0.0936480171 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bho", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.4016427491 + "score":0.1378127408 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bm", + "model":"google\/gemini-2.5-pro", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bm", + "model":"google\/gemini-2.5-pro", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.1331943797 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bm", + "model":"google\/gemini-2.5-pro", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.2183301061 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bm", + "model":"google\/gemini-2.5-pro", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.0187720962 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bm", + "model":"google\/gemini-2.5-pro", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.0552092745 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2183929994 + "score":0.3020434614 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.4877941086 + "score":0.4007490688 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.2700916391 + "score":0.2320524279 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"bn", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.5150577414 + "score":0.2712383449 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ca", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ca", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.1557590383 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ca", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.2999541814 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ca", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.2122477941 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ca", + "model":"google\/gemini-2.5-pro", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.2481311219 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ceb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ceb", - "task":"translation_from", - "metric":"bleu", - "score":0.2900668497 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ceb", - "task":"translation_from", - "metric":"chrf", - "score":0.5379961095 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ceb", - "task":"translation_to", - "metric":"bleu", - "score":0.3193377157 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ceb", - "task":"translation_to", - "metric":"chrf", - "score":0.5978978692 + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ckb", - "task":"classification", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ckb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2457083208 + "score":0.0568779007 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ckb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.4937183307 + "score":0.1090963624 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ckb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.1424911854 + "score":0.2392496577 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ckb", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.3546559531 + "score":0.3103186792 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", - "score":0.4 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.2481120403 + "score":0.0309583316 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5339550423 + "score":0.0727861543 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.3131426524 + "score":0.2299189265 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"cs", + "model":"google\/gemini-2.5-pro", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5548197404 + "score":0.3783014951 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3440655166 + "score":0.0594432616 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.563902418 + "score":0.1443026551 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.4305522274 + "score":0.0648561428 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"de", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.6477508732 + "score":0.0778645979 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.2080428665 + "score":0.2378006592 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.4376921278 + "score":0.3506619317 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3106300811 + "score":0.0741460229 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"el", + "model":"google\/gemini-2.5-pro", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.4971105137 + "score":0.1278099202 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"google\/gemini-2.5-pro", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"google\/gemini-2.5-pro", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"google\/gemini-2.5-pro", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.4113463435 + "score":0.0175340474 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"google\/gemini-2.5-pro", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.6260248317 + "score":0.1117737118 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"google\/gemini-2.5-pro", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.5310035709 + "score":0.2807209617 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"en", + "model":"google\/gemini-2.5-pro", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.7595845064 + "score":0.3753520077 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.3031284355 + "score":0.0505391541 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5241309352 + "score":0.08189026 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.3289699508 + "score":0.0784600421 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"es", + "model":"google\/gemini-2.5-pro", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.5811203167 + "score":0.1237015541 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"vi", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2483616515 + "score":0.1167387293 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.5338391625 + "score":0.1450666727 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.1651229998 + "score":0.3227616178 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fa", + "model":"google\/gemini-2.5-pro", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.3923963113 + "score":0.4512518394 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"google\/gemini-2.5-pro", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", - "task":"mmlu", + "model":"google\/gemini-2.5-pro", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.0673836275 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.12575806 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0232292611 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.0267312591 + }, + { + "model":"google\/gemini-2.5-pro", + "bcp_47":"yue", + "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"google\/gemini-2.5-pro", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.3057177881 + "score":0.0228307046 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"google\/gemini-2.5-pro", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.5523945263 + "score":0.1147202951 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"google\/gemini-2.5-pro", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.2711892461 + "score":0.0526793492 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fil", + "model":"google\/gemini-2.5-pro", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.5802332073 + "score":0.0504077394 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.3349110908 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.564806297 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.4574014191 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fr", + "model":"google\/gemini-2.5-pro", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.6626552528 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fuv", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ar", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fuv", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.0488154154 + "score":0.0474100022 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fuv", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.1944904286 + "score":0.1123198175 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fuv", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.0115014356 + "score":0.0125352085 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"fuv", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.1082073343 + "score":0.0283735992 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.2954497906 + "score":0.1714170596 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.5086877895 + "score":0.322217716 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.1582270271 + "score":0.0919538797 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"gu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.4201411039 + "score":0.1130426788 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.1697291765 + "score":0.0507278464 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.4073157654 + "score":0.1374307154 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.139672818 + "score":0.089396706 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ha", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.4450194819 + "score":0.164648643 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.3184042229 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.5712698408 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.3659029431 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hi", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.5796195236 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hne", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hne", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.2791185419 + "score":0.0644544724 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hne", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5226615992 + "score":0.1431172464 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hne", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.145820804 + "score":0.1618106339 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hne", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.3820953887 + "score":0.2951594047 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ht", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fa", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ht", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.1227062573 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ht", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.1954611936 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ht", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.0908738713 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ht", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.1791636936 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hu", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"mgsm", "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hu", - "task":"translation_from", - "metric":"bleu", - "score":0.2313008892 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hu", - "task":"translation_from", - "metric":"chrf", - "score":0.4915348458 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hu", - "task":"translation_to", - "metric":"bleu", - "score":0.2765024802 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"hu", - "task":"translation_to", - "metric":"chrf", - "score":0.5261755337 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2301748885 + "score":0.115635659 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.4682741896 + "score":0.21001665 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.3346592082 + "score":0.1625509988 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"id", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.6514874668 + "score":0.2704886762 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"hi", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"hi", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.154261694 + "score":0.023697236 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.3957095627 + "score":0.0393020248 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.1177946719 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ig", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.341868335 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ilo", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"id", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ilo", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.2239397579 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ilo", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.4512212104 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ilo", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"id", "task":"translation_to", "metric":"bleu", - "score":0.135748348 + "score":0.0525040446 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ilo", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"id", "task":"translation_to", "metric":"chrf", - "score":0.4408716957 + "score":0.1506768629 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.2724260509 + "score":0.0597280929 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5200202435 + "score":0.1348390312 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.2753225284 + "score":0.1112548291 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.5457466615 + "score":0.2280150235 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2664966821 + "score":0.0835367034 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5386982677 + "score":0.1878815782 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.2651365589 + "score":0.0362939834 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.409095006 + "score":0.0593832479 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"jv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.2326358655 + "score":0.0595037472 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.4815897231 + "score":0.1440055677 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2187928356 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemini-2.5-pro-preview", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.4896578943 + "score":0.1216146696 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ki", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ko", "task":"classification", "metric":"accuracy", "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ki", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.0693648124 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ki", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.1989936561 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ki", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.0087393249 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ki", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.0221958957 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kk", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"mr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kk", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.1666068635 + "score":0.1016207551 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kk", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.4554883841 + "score":0.1937396468 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kk", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.1547742726 + "score":0.0232755836 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kk", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4534139462 + "score":0.0683476995 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"km", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pa", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"km", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.2647824193 + "score":0.3259062344 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"km", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.5269086196 + "score":0.4538874381 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"km", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.1635334444 + "score":0.1871393365 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"km", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.3431273828 + "score":0.2200892244 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.247746183 + "score":0.1406086157 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.506339637 + "score":0.2057127554 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.1775009719 + "score":0.2664628529 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"kn", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.4300321597 + "score":0.3035324696 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2402657185 + "score":0.1104161719 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.497198112 + "score":0.2301836625 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.3100527074 + "score":0.185463581 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ko", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.3696197774 + "score":0.2585022568 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"lua", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"lua", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.0872330227 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"lua", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.3059813913 + "score":0.0271861792 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"lua", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.0010116202 + "score":0.1476512664 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"lua", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.1893341465 + "score":0.3192760623 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mag", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mag", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.3447519877 + "score":0.2136207431 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mag", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.578789784 + "score":0.3120102842 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mag", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.2508560655 + "score":0.114908602 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mag", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.4987822313 + "score":0.1409558682 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mai", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mai", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.2732982319 + "score":0.1209511429 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mai", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5233285219 + "score":0.1906473928 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mai", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.137657899 + "score":0.1356783563 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mai", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.3935929024 + "score":0.2003050615 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mg", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mg", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mg", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2082275626 + "score":0.0658153186 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mg", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.4639776287 + "score":0.1043402283 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mg", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.1350252624 + "score":0.2785590215 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mg", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.4834543859 + "score":0.3929421464 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ur", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2600500491 + "score":0.1341611323 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5029669853 + "score":0.2099852043 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.2091322046 + "score":0.0532408841 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ml", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.4711774201 + "score":0.0792848959 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2256246926 + "score":0.2017921323 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4703189943 + "score":0.2758120522 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.2254492518 + "score":0.2703866537 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"mr", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.447826525 + "score":0.3348006046 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.2986303081 + "score":0.0272258942 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.5546917725 + "score":0.0804193027 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.3680194341 + "score":0.0083321447 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"ms", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.6778287705 + "score":0.01475986 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.1979480779 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"my", + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.4791457508 + "score":0.0562014737 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.0400341425 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.0738358517 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.0278093886 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.1209403877 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.0460469917 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.1583874959 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.0746358572 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.2039454163 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0106555853 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.1635891431 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.0987853648 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.2172965208 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.0037326563 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.0273289802 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.0349474752 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.205929391 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.0109943205 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.1135056868 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.0231513455 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.1669816885 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.0192052173 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.1199941852 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.0482644911 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.1570610957 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.0671140896 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.0333540125 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.1654807425 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.0300458941 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.1417391491 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.0153668157 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.1119995149 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0988733729 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.2096173766 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.0696643378 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.1931858455 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.0309816185 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.1018697927 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.0634083235 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.1819427877 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.0728528728 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.2068099712 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.0726648889 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.2430791182 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.0528414924 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.1724803068 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.1903946317 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.3145924631 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.0310651444 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.0425897525 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.1329517484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.1071842556 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.2292182808 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.1295041316 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.2647572228 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.0551171959 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.2019792449 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1181725504 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.3417239653 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0030057917 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.050016858 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.1106488773 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.2661126449 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.0566112691 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.2161355093 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.1071586446 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.2867516145 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.1380160311 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.3472666619 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.1228102479 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.257059719 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.0709906394 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.1615768924 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.3271580119 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.4059591673 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.4705724484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.5810510479 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.0612440394 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.214820597 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.0718408174 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.2974455623 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.1093307519 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.2212819207 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.0461058798 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.1370841628 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.1005924157 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.202708484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.0160833262 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.1960110619 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.1269813968 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.3065913664 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.1789987295 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.3463028707 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.014745965 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.0749091363 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.0895914252 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.097971755 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.1777195033 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.0318870555 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.1529629731 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.0369448389 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.1480560277 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.0919802251 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.2629251679 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.2538230452 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.3759994265 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.0835774684 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.1904298158 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.0800273183 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.2260677118 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.0220446366 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.0997285023 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.0883989834 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.206785454 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.0790692679 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.28304649 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.0773479102 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.2587381281 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.0433423647 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.2817069358 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.0612163002 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.2381342912 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.0426402139 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.1696737174 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.0970247032 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.2111718332 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.0050070462 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.1683969558 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.139001615 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.2668336456 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.0475935646 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.2602541027 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.0609909305 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.1860226608 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.0692256682 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.1449932716 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.0495085803 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.1459303026 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.0098682093 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.1292642853 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.0827091376 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.2337306985 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.0492400989 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.155912411 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.0860125484 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.1623830923 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0024514101 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.0781695805 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.0937784828 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.2195953032 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.0577688436 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.1510063998 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.0680252346 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.2091636742 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.0555477009 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.0549298013 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0036630043 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.099240382 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0532977337 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.2153600503 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.1425685645 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.3016796517 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.0118929014 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.0840825564 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.115229855 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.2180450998 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.0163179059 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.0417840087 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.0410364581 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.2193286405 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.0422799242 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.1425526516 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.0630918824 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.1710971727 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.0386225926 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.1445595523 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.1084731704 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.2498733805 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.0399406962 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.033427329 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.1616696801 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.115786224 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.3018549986 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2294643956 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.3457333311 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1065767565 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.2047469752 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.0951128399 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.2178534884 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.0398161454 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.1412294262 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.0563796721 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.1918127836 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.0887408505 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.3444852597 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.0322569074 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.1681655692 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.0133097605 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.1890356187 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0380467697 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.11665963 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0196821089 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.1887330103 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.0987048471 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.2474195062 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.0246921682 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.1089265139 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.2220426626 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.3598952341 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.1611882376 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.2396561128 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.0904332342 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.2068730334 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.046065351 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.1925827805 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.1079576302 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.2645017017 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.0569295003 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.2615431845 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.131593328 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.3060223321 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.0757294413 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.2150897212 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.0926690761 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.2397253952 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.1044259789 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.236302624 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.0153852885 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.1605190155 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.0600552316 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.2182309051 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.120327349 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.2042820289 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0309396387 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.1043645846 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.0861987344 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.2079338406 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.0196434254 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.0610643505 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0320247445 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.2176774161 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.0700005142 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.1952413901 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.0252575003 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.157057904 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.0629444831 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.1833979697 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.0868186974 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.2586575848 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.1093378877 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.2502315423 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.0782352762 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.2378174872 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.0338179306 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.2284098709 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.1179976804 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.2633320797 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.0494945427 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.2411403917 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.1282740208 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.2521886667 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.0748708455 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.2420611826 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.1073230839 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.1798254279 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.0317538654 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.2038003362 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.1951561832 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.3697480899 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.1899598166 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.2894416622 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.0653258846 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.2205970586 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.0222271283 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.120000505 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.1262768628 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.2570885899 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.0575688551 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.1582234491 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.062613791 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0059519046 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.0274291267 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.0337787053 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.1824544035 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.1405643754 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.281387297 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.1091041441 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.2184696361 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.1508474535 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.234056096 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0058005929 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.0841095708 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1328221884 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.1386027419 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.3084595255 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.0167447692 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.0960347815 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.0342337572 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.1153353221 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.0694684605 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.2369528571 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.1615259525 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.2808117936 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.1251511875 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.3058766946 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0065958006 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.0642484091 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0043862302 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1616631945 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.0666328001 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.2282939681 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.0063550665 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.0402314549 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.0731036446 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.1810894045 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0117190064 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.1631103727 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.058648798 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.162917811 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.0647492243 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.1522863767 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1133445002 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.2630654346 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.0177899901 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.0452074918 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.0949407188 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.2042376654 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.0169223477 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.0689235431 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.2000811037 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0413489342 + }, + { + "model":"google\/gemini-2.5-pro-preview-05-06", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.1904482997 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2073802913 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4889223975 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.0840656979 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3453561943 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.120094546 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.3259782194 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0974181135 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.3477814679 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.2393172056 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4971254293 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2089212841 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3406916002 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.2712045148 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.5477096036 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.178052271 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.468064885 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2747843596 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5519960681 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2863967069 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5318173199 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1096694862 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4291604898 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1630720543 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3952400339 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1892846534 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4212342522 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1938470016 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4527968539 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2094379574 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4509809217 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1931386564 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.4233010233 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.2957522582 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5232039352 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2308361669 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4087255612 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.200456445 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4226152307 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1414132922 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.4170843853 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.18522743 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4467570037 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2590661095 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4657468506 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2663307677 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.519985227 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1913577407 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4064669591 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.271237739 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5173954387 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3067537945 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5194482945 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3694979709 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.59081536 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.374702944 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.6019503341 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.2792699678 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.5157552806 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.2334415639 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.5128705295 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.3536861453 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.6024608455 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.4031829559 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.6234553711 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3189602129 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5548503533 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.5229096392 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.7023434262 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.3137252517 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5147981205 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3302929673 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.505425141 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.3889146477 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.628092835 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.4660772497 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7280386297 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3593767686 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5668073679 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3662275621 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6102640711 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.286051969 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5373856549 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1816947237 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3981159206 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3579818144 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5889481625 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3403832088 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.590264879 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3180384008 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5571267732 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5778354146 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7490356238 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0380719948 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.2066039108 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0259757351 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.147148937 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.34811918 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5482709715 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1618983325 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4411905252 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1925315551 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4032389241 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.1992720083 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4905441802 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3722751955 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6207213131 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3378499277 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.554090013 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2879989689 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5083598943 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1719225434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3992950999 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.3234067809 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5706707095 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3187264685 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.5856828402 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3583744222 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5732194975 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3364664006 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6438910651 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.225000401 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.4567066441 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1941055199 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4504811493 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1944477164 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4517028309 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.2035517344 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.489419705 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3074361781 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5178180754 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3505959215 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5955060476 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2581140706 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5395853617 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.3298839393 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4471547552 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3177915441 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5387853038 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2549228547 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5322440265 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1983700044 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4843458319 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.2920207746 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.5345155349 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3702042307 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5776853975 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1498433716 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3652702605 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2858443353 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.5499221943 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2481102245 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4829685786 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2305492704 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.4826740501 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.1746024172 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3073554703 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0913600379 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.3305636235 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0269728382 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.3155017027 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3751831337 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.6085851316 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.259988405 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.5046714005 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.306099972 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5370842801 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.1736022871 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4305653856 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2826629018 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5215979873 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.238462643 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.5334745774 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.3161992509 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5479755911 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2133071404 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4660281027 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2370074805 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.4804215458 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2399769139 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4726429935 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3104483533 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5705763492 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.4229626959 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6856510383 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.2227645269 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4888582617 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1869632744 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4322398057 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.3115387303 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5342290246 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.22081567 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4878836055 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.3125704924 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5397676594 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3586968371 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6075205554 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1901221224 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.438728736 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1330024304 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.4711022084 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0258426139 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.2237241232 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.0460531144 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3418147419 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.3714452662 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.5977153904 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.2234825764 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4562477173 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.4180718844 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6426219278 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.3938693136 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5573992167 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2456102401 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5190609119 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.4265619216 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.6320824157 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.3537745123 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5904429929 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4588664196 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6844540285 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.3139442337 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5741447282 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.5016049999 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6788048008 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2449777422 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.5268764903 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.3789708434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.5790333031 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1839360587 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.448997409 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1891835724 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.508623725 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.3352727297 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.5583215205 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.2009000601 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.4004383195 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.2297304995 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.5040607132 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2136543311 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.3916393466 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.1221415503 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3516954503 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.108688779 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4515663403 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2308889646 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4618048204 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1667302795 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4717296026 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2351861569 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5329036218 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.4168384094 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6032787874 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.2291561983 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.4673987803 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.2036733766 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.5047620958 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.3500384253 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5797456052 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4268868445 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.664863412 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.3005035588 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5210660172 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.3401968092 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.6217197146 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2662307086 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.5053585639 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.3044345778 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5714036731 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3330093484 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5694168709 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.257812168 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5167002436 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.2176170344 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4496406258 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.2605536967 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4816066849 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2992360169 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5585599708 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.4269079012 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.5719718715 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.2042995208 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.416626147 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0833250166 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.1982489294 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2832304201 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5467240003 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3273464288 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5827048506 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2813742416 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5413704266 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.4063054094 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.6020718231 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0495917134 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.1711087397 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0358872001 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.2761667256 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.322448107 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5887654616 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2148139783 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4226865444 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.2829644119 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.5194956482 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2911955464 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.5560139888 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2745000434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5206422805 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.4261790941 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6358462464 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.0696458062 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2461140434 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0728989985 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.2267265908 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.2072386748 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.4628288648 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1471425714 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1971299212 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.253783308 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.4487387303 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0662544821 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3784904721 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0887390501 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.3201148841 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.1178050815 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.307433063 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.2253512269 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4949150094 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1897306863 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2561574259 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.2201641871 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5051068628 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.2508351517 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.3110461024 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.252616884 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4822778382 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.1940901676 + }, + { + "model":"google\/gemini-flash-1.5", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.4661416094 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2041309024 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4630820951 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1453469275 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3874336138 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.1059711376 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.300568481 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0110669593 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2141540563 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1906134629 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4467868389 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.2001643223 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.3225170104 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.1876459632 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.4830875841 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.1830944017 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.4175337587 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.260683336 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5383651277 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.2962406565 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5190026627 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1438491224 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.418499848 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1044262978 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3577242047 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1675595946 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4187188467 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.1545869288 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4031218248 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.1892328534 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4434206925 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.1070430926 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.3318636339 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3180630074 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5401606876 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.1993490206 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.4215901923 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1604267099 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4139767864 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1651025864 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.3978212407 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.19213953 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4512512424 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.2406657525 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.4536513075 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2519150677 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4966963131 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.2057435019 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.4016427491 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2183929994 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.4877941086 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.2700916391 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5150577414 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.2900668497 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5379961095 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.3193377157 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.5978978692 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.2457083208 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4937183307 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.1424911854 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3546559531 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2481120403 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5339550423 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.3131426524 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5548197404 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3440655166 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.563902418 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.4305522274 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.6477508732 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2080428665 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.4376921278 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3106300811 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.4971105137 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.4113463435 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6260248317 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5310035709 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7595845064 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3031284355 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5241309352 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3289699508 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.5811203167 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2483616515 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5338391625 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1651229998 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.3923963113 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3057177881 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5523945263 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.2711892461 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.5802332073 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.3349110908 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.564806297 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.4574014191 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.6626552528 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0488154154 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1944904286 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0115014356 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1082073343 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.2954497906 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5086877895 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1582270271 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4201411039 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1697291765 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.4073157654 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.139672818 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4450194819 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3184042229 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.5712698408 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3659029431 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.5796195236 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2791185419 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.5226615992 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.145820804 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3820953887 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2313008892 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.4915348458 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.2765024802 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.5261755337 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.2301748885 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.4682741896 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3346592082 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6514874668 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.154261694 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.3957095627 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1177946719 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.341868335 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.2239397579 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.4512212104 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.135748348 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4408716957 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.2724260509 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5200202435 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.2753225284 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.5457466615 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2664966821 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5386982677 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.2651365589 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.409095006 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.2326358655 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.4815897231 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2187928356 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.4896578943 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.1666068635 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4554883841 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.1547742726 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4534139462 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.2647824193 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5269086196 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.1635334444 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3431273828 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.247746183 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.506339637 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.1775009719 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.4300321597 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2402657185 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.497198112 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.3100527074 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3696197774 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0872330227 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.3059813913 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0010116202 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.1893341465 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3447519877 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.578789784 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2508560655 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.4987822313 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.2732982319 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5233285219 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.137657899 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.3935929024 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2082275626 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.4639776287 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1350252624 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4834543859 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2600500491 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5029669853 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2091322046 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4711774201 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.2256246926 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.4703189943 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2254492518 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.447826525 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.2986303081 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.5546917725 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3680194341 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.6778287705 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.1979480779 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4791457508 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_to", + "metric":"bleu", + "score":0.1536786708 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"my", + "task":"translation_to", + "metric":"chrf", + "score":0.4315811907 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_from", + "metric":"bleu", + "score":0.2955515679 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_from", + "metric":"chrf", + "score":0.5399574649 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_to", + "metric":"bleu", + "score":0.2350766648 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ne", + "task":"translation_to", + "metric":"chrf", + "score":0.4890671168 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_from", + "metric":"bleu", + "score":0.2583853642 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_from", + "metric":"chrf", + "score":0.5143387984 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_to", + "metric":"bleu", + "score":0.3585971813 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"nl", + "task":"translation_to", + "metric":"chrf", + "score":0.6255063069 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_from", + "metric":"bleu", + "score":0.1562574059 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_from", + "metric":"chrf", + "score":0.378833839 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_to", + "metric":"bleu", + "score":0.1000795039 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ny", + "task":"translation_to", + "metric":"chrf", + "score":0.447037349 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_from", + "metric":"bleu", + "score":0.0981161875 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_from", + "metric":"chrf", + "score":0.3370208163 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_to", + "metric":"bleu", + "score":0.040931235 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"om", + "task":"translation_to", + "metric":"chrf", + "score":0.3615428475 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_from", + "metric":"bleu", + "score":0.2626677598 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_from", + "metric":"chrf", + "score":0.4970567085 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_to", + "metric":"bleu", + "score":0.1807466012 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"or", + "task":"translation_to", + "metric":"chrf", + "score":0.4219189716 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_from", + "metric":"bleu", + "score":0.3706063992 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_from", + "metric":"chrf", + "score":0.6167676482 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.4234596823 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.5629443923 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_from", + "metric":"bleu", + "score":0.2754265608 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_from", + "metric":"chrf", + "score":0.5207065369 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_to", + "metric":"bleu", + "score":0.3700040895 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pl", + "task":"translation_to", + "metric":"chrf", + "score":0.5924241261 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_from", + "metric":"bleu", + "score":0.2971403532 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_from", + "metric":"chrf", + "score":0.5321068893 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_to", + "metric":"bleu", + "score":0.4364286549 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"pt", + "task":"translation_to", + "metric":"chrf", + "score":0.6509885745 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_from", + "metric":"bleu", + "score":0.27702997 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_from", + "metric":"chrf", + "score":0.5437386483 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_to", + "metric":"bleu", + "score":0.4580925611 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ro", + "task":"translation_to", + "metric":"chrf", + "score":0.6514836722 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_from", + "metric":"bleu", + "score":0.2300270544 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_from", + "metric":"chrf", + "score":0.4839384065 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_to", + "metric":"bleu", + "score":0.4236492288 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ru", + "task":"translation_to", + "metric":"chrf", + "score":0.6116207052 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_from", + "metric":"bleu", + "score":0.1602143293 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_from", + "metric":"chrf", + "score":0.3793757948 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_to", + "metric":"bleu", + "score":0.1370228414 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"rw", + "task":"translation_to", + "metric":"chrf", + "score":0.4797772284 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_from", + "metric":"bleu", + "score":0.2571204202 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_from", + "metric":"chrf", + "score":0.4946608155 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_to", + "metric":"bleu", + "score":0.0869374651 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sd", + "task":"translation_to", + "metric":"chrf", + "score":0.3119061498 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_from", + "metric":"bleu", + "score":0.1981443603 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_from", + "metric":"chrf", + "score":0.4536105905 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_to", + "metric":"bleu", + "score":0.2278086127 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"si", + "task":"translation_to", + "metric":"chrf", + "score":0.4013315084 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_from", + "metric":"bleu", + "score":0.0939343156 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_from", + "metric":"chrf", + "score":0.3129229613 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_to", + "metric":"bleu", + "score":0.074740365 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sn", + "task":"translation_to", + "metric":"chrf", + "score":0.4045773842 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_from", + "metric":"bleu", + "score":0.2273071628 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_from", + "metric":"chrf", + "score":0.4497946959 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_to", + "metric":"bleu", + "score":0.1824497409 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"so", + "task":"translation_to", + "metric":"chrf", + "score":0.4972329945 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_from", + "metric":"bleu", + "score":0.2541965029 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_from", + "metric":"chrf", + "score":0.5234491687 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_to", + "metric":"bleu", + "score":0.3308712415 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.5512495988 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_from", + "metric":"bleu", + "score":0.1522391036 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_from", + "metric":"chrf", + "score":0.3508292995 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_to", + "metric":"bleu", + "score":0.1514782919 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"su", + "task":"translation_to", + "metric":"chrf", + "score":0.4909144205 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_from", + "metric":"bleu", + "score":0.2959760233 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_from", + "metric":"chrf", + "score":0.5398896148 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_to", + "metric":"bleu", + "score":0.4357891553 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sv", + "task":"translation_to", + "metric":"chrf", + "score":0.6529723913 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_from", + "metric":"bleu", + "score":0.2501435914 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_from", + "metric":"chrf", + "score":0.5088299265 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_to", + "metric":"bleu", + "score":0.262372343 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"sw", + "task":"translation_to", + "metric":"chrf", + "score":0.5806899403 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_from", + "metric":"bleu", + "score":0.2450100573 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_from", + "metric":"chrf", + "score":0.4918691312 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_to", + "metric":"bleu", + "score":0.2434733519 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ta", + "task":"translation_to", + "metric":"chrf", + "score":0.5120095348 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_from", + "metric":"bleu", + "score":0.3568851036 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_from", + "metric":"chrf", + "score":0.5825326367 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_to", + "metric":"bleu", + "score":0.3112091725 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"te", + "task":"translation_to", + "metric":"chrf", + "score":0.5431414206 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_from", + "metric":"bleu", + "score":0.1741933649 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_from", + "metric":"chrf", + "score":0.4272342177 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_to", + "metric":"bleu", + "score":0.1811584685 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tg", + "task":"translation_to", + "metric":"chrf", + "score":0.4001890626 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_from", + "metric":"bleu", + "score":0.2544201673 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_from", + "metric":"chrf", + "score":0.5081271409 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_to", + "metric":"bleu", + "score":0.2942923294 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"th", + "task":"translation_to", + "metric":"chrf", + "score":0.4479604827 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_from", + "metric":"bleu", + "score":0.0881111208 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_from", + "metric":"chrf", + "score":0.3173214379 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_to", + "metric":"bleu", + "score":0.0384668791 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ti", + "task":"translation_to", + "metric":"chrf", + "score":0.1259439982 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"mmlu", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_from", + "metric":"bleu", + "score":0.2563119866 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_from", + "metric":"chrf", + "score":0.5291012922 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_to", + "metric":"bleu", + "score":0.3009595898 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.5854044281 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_from", + "metric":"bleu", + "score":0.2567288533 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_from", + "metric":"chrf", + "score":0.5177571061 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_to", + "metric":"bleu", + "score":0.3201007033 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uk", + "task":"translation_to", + "metric":"chrf", + "score":0.5323037228 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_from", + "metric":"bleu", + "score":0.0115980217 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_from", + "metric":"chrf", + "score":0.115883071 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_to", + "metric":"bleu", + "score":0.0129780747 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"umb", + "task":"translation_to", + "metric":"chrf", + "score":0.1450749981 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_from", + "metric":"bleu", + "score":0.2402951661 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_from", + "metric":"chrf", + "score":0.5033005385 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_to", + "metric":"bleu", + "score":0.2302239803 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"ur", + "task":"translation_to", + "metric":"chrf", + "score":0.4066956434 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_from", + "metric":"bleu", + "score":0.203750264 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_from", + "metric":"chrf", + "score":0.4979829233 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_to", + "metric":"bleu", + "score":0.2162945849 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"uz", + "task":"translation_to", + "metric":"chrf", + "score":0.4941278712 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_from", + "metric":"bleu", + "score":0.2537752957 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_from", + "metric":"chrf", + "score":0.5073147534 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_to", + "metric":"bleu", + "score":0.3583753747 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"vi", + "task":"translation_to", + "metric":"chrf", + "score":0.6253917282 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"classification", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"mgsm", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_from", + "metric":"bleu", + "score":0.1081430594 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_from", + "metric":"chrf", + "score":0.2665454299 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_to", + "metric":"bleu", + "score":0.0142970887 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wo", + "task":"translation_to", + "metric":"chrf", + "score":0.1489810124 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"bleu", + "score":0.1700904158 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_from", + "metric":"chrf", + "score":0.421111634 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"bleu", + "score":0.1213993524 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"wuu", + "task":"translation_to", + "metric":"chrf", + "score":0.1655788185 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"mgsm", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_from", + "metric":"bleu", + "score":0.1531171972 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_from", + "metric":"chrf", + "score":0.3828830786 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_to", + "metric":"bleu", + "score":0.0483942569 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"xh", + "task":"translation_to", + "metric":"chrf", + "score":0.3116951706 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_from", + "metric":"bleu", + "score":0.0816098185 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_from", + "metric":"chrf", + "score":0.2781732759 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_to", + "metric":"bleu", + "score":0.041496472 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yo", + "task":"translation_to", + "metric":"chrf", + "score":0.202397124 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_from", + "metric":"bleu", + "score":0.1783312983 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_from", + "metric":"chrf", + "score":0.4423885999 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_to", + "metric":"bleu", + "score":0.1632112014 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"yue", + "task":"translation_to", + "metric":"chrf", + "score":0.2297357227 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"mmlu", + "metric":"accuracy", + "score":0.9 }, { "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_from", + "metric":"bleu", + "score":0.249810194 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_from", + "metric":"chrf", + "score":0.5151255506 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_to", + "metric":"bleu", + "score":0.1854861198 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zh", + "task":"translation_to", + "metric":"chrf", + "score":0.2463326959 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"mgsm", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_from", + "metric":"bleu", + "score":0.1729786376 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_from", + "metric":"chrf", + "score":0.4189697233 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_to", + "metric":"bleu", + "score":0.0866404913 + }, + { + "model":"google\/gemini-flash-1.5-8b", + "bcp_47":"zu", + "task":"translation_to", + "metric":"chrf", + "score":0.3943277627 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"bleu", + "score":0.2177971147 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_from", + "metric":"chrf", + "score":0.4738076987 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"bleu", + "score":0.1414064724 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"aeb", + "task":"translation_to", + "metric":"chrf", + "score":0.3965739567 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"af", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"mgsm", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"mmlu", + "metric":"accuracy", + "score":0.1 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_from", + "metric":"bleu", + "score":0.076595229 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_from", + "metric":"chrf", + "score":0.2493366365 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_to", + "metric":"bleu", + "score":0.0440715947 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ak", + "task":"translation_to", + "metric":"chrf", + "score":0.2820233612 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_from", + "metric":"bleu", + "score":0.1913062339 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_from", + "metric":"chrf", + "score":0.4296053228 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_to", + "metric":"bleu", + "score":0.13443556 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"am", + "task":"translation_to", + "metric":"chrf", + "score":0.2528930204 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_from", + "metric":"bleu", + "score":0.24265587 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_from", + "metric":"chrf", + "score":0.4918380331 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_to", + "metric":"bleu", + "score":0.2104382871 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"apc", + "task":"translation_to", + "metric":"chrf", + "score":0.456050442 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_from", + "metric":"bleu", + "score":0.2891206499 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_from", + "metric":"chrf", + "score":0.5438550217 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_to", + "metric":"bleu", + "score":0.3184721364 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ar", + "task":"translation_to", + "metric":"chrf", + "score":0.5483731849 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_from", + "metric":"bleu", + "score":0.1664804364 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_from", + "metric":"chrf", + "score":0.4585261833 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_to", + "metric":"bleu", + "score":0.1299183594 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ary", + "task":"translation_to", + "metric":"chrf", + "score":0.3752977557 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_from", + "metric":"bleu", + "score":0.1618648119 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_from", + "metric":"chrf", + "score":0.4104839109 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_to", + "metric":"bleu", + "score":0.2266738862 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"arz", + "task":"translation_to", + "metric":"chrf", + "score":0.4315390742 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_from", + "metric":"bleu", + "score":0.2602059805 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_from", + "metric":"chrf", + "score":0.4987515978 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_to", + "metric":"bleu", + "score":0.0907943093 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"as", + "task":"translation_to", + "metric":"chrf", + "score":0.348768221 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_from", + "metric":"bleu", + "score":0.3277667824 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_from", + "metric":"chrf", + "score":0.5267403611 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_to", + "metric":"bleu", + "score":0.2123273366 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"awa", + "task":"translation_to", + "metric":"chrf", + "score":0.408906638 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_from", + "metric":"bleu", + "score":0.1880331404 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_from", + "metric":"chrf", + "score":0.4234748209 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_to", + "metric":"bleu", + "score":0.1517877566 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"az", + "task":"translation_to", + "metric":"chrf", + "score":0.423956163 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.148851004 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.4514291775 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.3105472783 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.498684126 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_from", + "metric":"bleu", + "score":0.2430984589 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_from", + "metric":"chrf", + "score":0.4969060141 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_to", + "metric":"bleu", + "score":0.1699224465 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bho", + "task":"translation_to", + "metric":"chrf", + "score":0.3964402252 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bm", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"mgsm", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_from", + "metric":"bleu", + "score":0.2907230812 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_from", + "metric":"chrf", + "score":0.5148223626 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_to", + "metric":"bleu", + "score":0.3473636391 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"bn", + "task":"translation_to", + "metric":"chrf", + "score":0.5442574441 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ca", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"bleu", + "score":0.3650597419 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_from", + "metric":"chrf", + "score":0.5512750223 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"bleu", + "score":0.293824845 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ceb", + "task":"translation_to", + "metric":"chrf", + "score":0.5724817779 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"bleu", + "score":0.1983726871 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_from", + "metric":"chrf", + "score":0.4779908235 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"bleu", + "score":0.0792877335 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ckb", + "task":"translation_to", + "metric":"chrf", + "score":0.3908004248 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_from", + "metric":"bleu", + "score":0.2863884915 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_from", + "metric":"chrf", + "score":0.5641108436 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_to", + "metric":"bleu", + "score":0.352498756 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"cs", + "task":"translation_to", + "metric":"chrf", + "score":0.5860513143 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"mmlu", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_from", + "metric":"bleu", + "score":0.3577876868 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_from", + "metric":"chrf", + "score":0.5943423055 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_to", + "metric":"bleu", + "score":0.5344280565 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"de", + "task":"translation_to", + "metric":"chrf", + "score":0.7084649844 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_from", + "metric":"bleu", + "score":0.2914236052 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_from", + "metric":"chrf", + "score":0.5147962724 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_to", + "metric":"bleu", + "score":0.3761179017 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"el", + "task":"translation_to", + "metric":"chrf", + "score":0.5590147212 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_from", + "metric":"bleu", + "score":0.452427177 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_from", + "metric":"chrf", + "score":0.6525566656 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_to", + "metric":"bleu", + "score":0.5467976399 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"en", + "task":"translation_to", + "metric":"chrf", + "score":0.7780833183 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"mmlu", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_from", + "metric":"bleu", + "score":0.3554331718 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_from", + "metric":"chrf", + "score":0.5997743406 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_to", + "metric":"bleu", + "score":0.3847830842 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"es", + "task":"translation_to", + "metric":"chrf", + "score":0.6191109047 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_from", + "metric":"bleu", + "score":0.2579194729 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_from", + "metric":"chrf", + "score":0.5351839762 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_to", + "metric":"bleu", + "score":0.1571676635 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fa", + "task":"translation_to", + "metric":"chrf", + "score":0.4046770996 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_from", + "metric":"bleu", + "score":0.3771043132 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_from", + "metric":"chrf", + "score":0.5835797455 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_to", + "metric":"bleu", + "score":0.3564426025 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fil", + "task":"translation_to", + "metric":"chrf", + "score":0.6107274367 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"mgsm", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_from", + "metric":"bleu", + "score":0.2846092378 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_from", + "metric":"chrf", + "score":0.5655970541 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_to", + "metric":"bleu", + "score":0.5192984544 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fr", + "task":"translation_to", + "metric":"chrf", + "score":0.7020040834 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"bleu", + "score":0.0220051815 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_from", + "metric":"chrf", + "score":0.1861453784 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"bleu", + "score":0.0227307294 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"fuv", + "task":"translation_to", + "metric":"chrf", + "score":0.1850492522 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_from", + "metric":"bleu", + "score":0.2796934014 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_from", + "metric":"chrf", + "score":0.5155626456 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_to", + "metric":"bleu", + "score":0.1979202011 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"gu", + "task":"translation_to", + "metric":"chrf", + "score":0.4528880823 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"mgsm", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_from", + "metric":"bleu", + "score":0.1595296755 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_from", + "metric":"chrf", + "score":0.3859356797 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_to", + "metric":"bleu", + "score":0.171830216 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ha", + "task":"translation_to", + "metric":"chrf", + "score":0.4608354018 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"mmlu", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_from", + "metric":"bleu", + "score":0.3520691191 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_from", + "metric":"chrf", + "score":0.6035990708 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_to", + "metric":"bleu", + "score":0.3987037224 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hi", + "task":"translation_to", + "metric":"chrf", + "score":0.6195037668 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_from", + "metric":"bleu", + "score":0.2709410734 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_from", + "metric":"chrf", + "score":0.4976144005 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_to", + "metric":"bleu", + "score":0.1150407607 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hne", + "task":"translation_to", + "metric":"chrf", + "score":0.3709160058 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ht", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"classification", + "metric":"accuracy", + "score":0.8 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"mgsm", + "metric":"accuracy", + "score":0.5 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_from", + "metric":"bleu", + "score":0.2903150375 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_from", + "metric":"chrf", + "score":0.5392715859 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_to", + "metric":"bleu", + "score":0.3460432788 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"hu", + "task":"translation_to", + "metric":"chrf", + "score":0.6009670508 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_from", + "metric":"bleu", + "score":0.3377417704 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_from", + "metric":"chrf", + "score":0.5674360496 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_to", + "metric":"bleu", + "score":0.3534620252 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.6680177029 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"mgsm", + "metric":"accuracy", + "score":0.6 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_from", + "metric":"bleu", + "score":0.1600009223 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_from", + "metric":"chrf", + "score":0.3857586031 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_to", + "metric":"bleu", + "score":0.1602266912 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ig", + "task":"translation_to", + "metric":"chrf", + "score":0.4091024664 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"bleu", + "score":0.1546473042 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_from", + "metric":"chrf", + "score":0.3985794204 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"bleu", + "score":0.1752645287 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ilo", + "task":"translation_to", + "metric":"chrf", + "score":0.4668449261 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_from", + "metric":"bleu", + "score":0.3356485456 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_from", + "metric":"chrf", + "score":0.5684527887 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_to", + "metric":"bleu", + "score":0.3627134123 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"it", + "task":"translation_to", + "metric":"chrf", + "score":0.6050822949 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"mgsm", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_from", + "metric":"bleu", + "score":0.2481856237 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_from", + "metric":"chrf", + "score":0.5180749152 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_to", + "metric":"bleu", + "score":0.242508046 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ja", + "task":"translation_to", + "metric":"chrf", + "score":0.4046420215 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_from", + "metric":"bleu", + "score":0.3019627022 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_from", + "metric":"chrf", + "score":0.5133980923 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_to", + "metric":"bleu", + "score":0.2316517545 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"jv", + "task":"translation_to", + "metric":"chrf", + "score":0.5189963647 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"classification", + "metric":"accuracy", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_from", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_from", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_to", + "metric":"bleu", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ki", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_from", + "metric":"bleu", + "score":0.2187004813 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_from", + "metric":"chrf", + "score":0.4910590831 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_to", + "metric":"bleu", + "score":0.2108939118 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kk", + "task":"translation_to", + "metric":"chrf", + "score":0.4375825873 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_from", + "metric":"bleu", + "score":0.3274744668 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_from", + "metric":"chrf", + "score":0.5605813039 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_to", + "metric":"bleu", + "score":0.0800539722 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"km", + "task":"translation_to", + "metric":"chrf", + "score":0.3336188156 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_from", + "metric":"bleu", + "score":0.2692189197 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_from", + "metric":"chrf", + "score":0.5290912174 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_to", + "metric":"bleu", + "score":0.2869741566 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"kn", + "task":"translation_to", + "metric":"chrf", + "score":0.5072256514 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"classification", + "metric":"accuracy", + "score":0.9 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"mmlu", + "metric":"accuracy", + "score":0.3 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_from", + "metric":"bleu", + "score":0.2172591082 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_from", + "metric":"chrf", + "score":0.478962626 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_to", + "metric":"bleu", + "score":0.2169046229 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ko", + "task":"translation_to", + "metric":"chrf", + "score":0.3151387909 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"classification", + "metric":"accuracy", + "score":0.7 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_from", + "metric":"bleu", + "score":0.0905061152 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_from", + "metric":"chrf", + "score":0.321707617 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_to", + "metric":"bleu", + "score":0.0361920973 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"lua", + "task":"translation_to", + "metric":"chrf", + "score":0.222315171 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_from", + "metric":"bleu", + "score":0.3100950481 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_from", + "metric":"chrf", + "score":0.558054933 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_to", + "metric":"bleu", + "score":0.2213152575 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.4821662369 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_from", + "metric":"bleu", + "score":0.3126340837 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_from", + "metric":"chrf", + "score":0.5601639768 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_to", + "metric":"bleu", + "score":0.1875297747 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mai", + "task":"translation_to", + "metric":"chrf", + "score":0.4394137195 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"mmlu", + "metric":"accuracy", + "score":0.4 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_from", + "metric":"bleu", + "score":0.2502298144 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_from", + "metric":"chrf", + "score":0.5206889602 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_to", + "metric":"bleu", + "score":0.1301910408 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mg", + "task":"translation_to", + "metric":"chrf", + "score":0.4488625613 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_from", + "metric":"bleu", + "score":0.2809005667 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_from", + "metric":"chrf", + "score":0.5466717628 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_to", + "metric":"bleu", + "score":0.2287455417 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ml", + "task":"translation_to", + "metric":"chrf", + "score":0.4915489263 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_from", + "metric":"bleu", + "score":0.3395095603 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_from", + "metric":"chrf", + "score":0.5877742809 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_to", + "metric":"bleu", + "score":0.2222923122 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"mr", + "task":"translation_to", + "metric":"chrf", + "score":0.4572688692 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"mmlu", + "metric":"accuracy", + "score":0.2 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_from", + "metric":"bleu", + "score":0.3794800258 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_from", + "metric":"chrf", + "score":0.6256125923 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_to", + "metric":"bleu", + "score":0.3593747877 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"ms", + "task":"translation_to", + "metric":"chrf", + "score":0.664135376 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"classification", + "metric":"accuracy", + "score":1.0 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"translation_from", + "metric":"bleu", + "score":0.251920694 + }, + { + "model":"google\/gemma-3-27b-it", + "bcp_47":"my", + "task":"translation_from", + "metric":"chrf", + "score":0.4662583176 + }, + { + "model":"google\/gemma-3-27b-it", "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.1536786708 + "score":0.1647980206 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.4315811907 + "score":0.4166796691 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ne", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ne", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.2955515679 + "score":0.3022338928 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5399574649 + "score":0.5587522289 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2350766648 + "score":0.2252421952 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.4890671168 + "score":0.4768786292 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2583853642 + "score":0.2793746981 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5143387984 + "score":0.5246312011 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3585971813 + "score":0.3496466203 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6255063069 + "score":0.6032151622 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ny", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ny", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.1562574059 + "score":0.119086784 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.378833839 + "score":0.3898511388 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.1000795039 + "score":0.0923649849 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.447037349 + "score":0.4837931302 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.1 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.2 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.0981161875 + "score":0.0417850648 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.3370208163 + "score":0.2509675066 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.040931235 + "score":0.0312813941 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.3615428475 + "score":0.2886309955 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"or", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2626677598 + "score":0.2613495089 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.4970567085 + "score":0.5009335042 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.1807466012 + "score":0.1648455996 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.4219189716 + "score":0.3943041737 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pa", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pa", "task":"translation_from", "metric":"bleu", - "score":0.3706063992 + "score":0.4164890636 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pa", "task":"translation_from", "metric":"chrf", - "score":0.6167676482 + "score":0.6375470445 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pa", "task":"translation_to", "metric":"bleu", - "score":0.4234596823 + "score":0.4166823661 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pa", "task":"translation_to", "metric":"chrf", - "score":0.5629443923 + "score":0.575314128 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.2 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2754265608 + "score":0.2913506513 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.5207065369 + "score":0.5431985912 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3700040895 + "score":0.3723742743 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.5924241261 + "score":0.5891983505 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pt", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pt", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.2971403532 + "score":0.340245547 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5321068893 + "score":0.5681284927 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.4364286549 + "score":0.4702737577 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6509885745 + "score":0.6903236014 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.27702997 + "score":0.272965046 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5437386483 + "score":0.5527916308 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.4580925611 + "score":0.5195197328 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.6514836722 + "score":0.6892729705 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"mgsm", "metric":"accuracy", - "score":0.9 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2300270544 + "score":0.2862936285 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.4839384065 + "score":0.5264436928 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.4236492288 + "score":0.4800957551 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.6116207052 + "score":0.6618495803 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"mgsm", "metric":"accuracy", - "score":0.2 + "score":0.3 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"mmlu", "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.1602143293 + "score":0.1701995093 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.3793757948 + "score":0.4262662427 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.1370228414 + "score":0.1513262342 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.4797772284 + "score":0.4732082637 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sd", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.2571204202 + "score":0.2365858071 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.4946608155 + "score":0.4722212406 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.0869374651 + "score":0.2251623508 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.3119061498 + "score":0.4159341653 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"si", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"si", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.1981443603 + "score":0.226689844 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4536105905 + "score":0.4706510499 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2278086127 + "score":0.2258552473 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.4013315084 + "score":0.4191499082 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.0939343156 + "score":0.0756830418 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.3129229613 + "score":0.3184767575 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.074740365 + "score":0.0495523985 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.4045773842 + "score":0.3971096934 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"so", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"so", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.2273071628 + "score":0.1915993132 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.4497946959 + "score":0.4208812642 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.1824497409 + "score":0.1724511246 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.4972329945 + "score":0.4741419887 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sr", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sr", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.2541965029 + "score":0.245439349 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.5234491687 + "score":0.536270172 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.3308712415 + "score":0.3929818488 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sr", "task":"translation_to", "metric":"chrf", - "score":0.5512495988 + "score":0.5787667028 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"su", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.1522391036 + "score":0.1784974236 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.3508292995 + "score":0.4520828188 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.1514782919 + "score":0.1435021957 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.4909144205 + "score":0.4868234587 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"mmlu", "metric":"accuracy", - "score":0.7 + "score":0.5 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.2959760233 + "score":0.3258404036 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5398896148 + "score":0.5652149653 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.4357891553 + "score":0.4264864443 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.6529723913 + "score":0.6543542662 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"mgsm", "metric":"accuracy", "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.2501435914 + "score":0.268709657 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5088299265 + "score":0.5306834056 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.262372343 + "score":0.3395981599 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.5806899403 + "score":0.6130756934 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ta", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2450100573 + "score":0.2563448403 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.4918691312 + "score":0.5007966916 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.2434733519 + "score":0.2405135195 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5120095348 + "score":0.5564984925 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"mgsm", "metric":"accuracy", - "score":0.6 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"mmlu", "metric":"accuracy", - "score":0.6 + "score":0.2 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.3568851036 + "score":0.2787922254 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5825326367 + "score":0.5420797212 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.3112091725 + "score":0.259866454 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.5431414206 + "score":0.48543634 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tg", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tg", "task":"translation_from", "metric":"bleu", - "score":0.1741933649 + "score":0.2018690154 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tg", "task":"translation_from", "metric":"chrf", - "score":0.4272342177 + "score":0.4335923466 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tg", "task":"translation_to", "metric":"bleu", - "score":0.1811584685 + "score":0.0972794658 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tg", "task":"translation_to", "metric":"chrf", - "score":0.4001890626 + "score":0.327182503 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"th", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"th", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2544201673 + "score":0.2400131449 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.5081271409 + "score":0.4851690277 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.2942923294 + "score":0.383380628 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.4479604827 + "score":0.5430720239 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ti", "task":"classification", "metric":"accuracy", "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.0881111208 + "score":0.0736674948 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.3173214379 + "score":0.2974206944 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.0384668791 + "score":0.0241026131 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.1259439982 + "score":0.1246172628 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tr", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tr", "task":"mmlu", "metric":"accuracy", - "score":0.8 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2563119866 + "score":0.2757340333 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5291012922 + "score":0.5244536559 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tr", "task":"translation_to", "metric":"bleu", - "score":0.3009595898 + "score":0.3185578758 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"tr", "task":"translation_to", "metric":"chrf", - "score":0.5854044281 + "score":0.5765088485 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uk", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uk", "task":"mmlu", "metric":"accuracy", "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.2567288533 + "score":0.2918547905 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.5177571061 + "score":0.5631912653 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.3201007033 + "score":0.3283437369 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.5323037228 + "score":0.5565790802 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"umb", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"umb", "task":"translation_from", "metric":"bleu", - "score":0.0115980217 + "score":0.0359452883 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"umb", "task":"translation_from", "metric":"chrf", - "score":0.115883071 + "score":0.1779043042 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"umb", "task":"translation_to", "metric":"bleu", - "score":0.0129780747 + "score":0.0305779168 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"umb", "task":"translation_to", "metric":"chrf", - "score":0.1450749981 + "score":0.1838354035 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ur", "task":"classification", "metric":"accuracy", "score":0.9 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2402951661 + "score":0.2595582459 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5033005385 + "score":0.5043992681 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.2302239803 + "score":0.2142625601 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.4066956434 + "score":0.429749938 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uz", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.203750264 + "score":0.2595944841 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.4979829233 + "score":0.5081810113 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2162945849 + "score":0.2601189518 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.4941278712 + "score":0.5225655991 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"vi", "task":"classification", "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"bleu", - "score":0.2537752957 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_from", - "metric":"chrf", - "score":0.5073147534 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"vi", - "task":"translation_to", - "metric":"bleu", - "score":0.3583753747 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", + "model":"google\/gemma-3-27b-it", "bcp_47":"vi", - "task":"translation_to", - "metric":"chrf", - "score":0.6253917282 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", - "task":"classification", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.2 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", - "task":"translation_from", - "metric":"bleu", - "score":0.1081430594 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", - "task":"translation_from", - "metric":"chrf", - "score":0.2665454299 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", - "task":"translation_to", - "metric":"bleu", - "score":0.0142970887 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wo", - "task":"translation_to", - "metric":"chrf", - "score":0.1489810124 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", - "task":"translation_from", - "metric":"bleu", - "score":0.1700904158 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", - "task":"translation_from", - "metric":"chrf", - "score":0.421111634 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", - "task":"translation_to", - "metric":"bleu", - "score":0.1213993524 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"wuu", - "task":"translation_to", - "metric":"chrf", - "score":0.1655788185 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", - "task":"mgsm", - "metric":"accuracy", "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.1531171972 + "score":0.2279880384 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.3828830786 + "score":0.4835933272 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.0483942569 + "score":0.3478085621 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"xh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.3116951706 + "score":0.5968604742 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"classification", "metric":"accuracy", - "score":1.0 + "score":0.8 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"mgsm", "metric":"accuracy", - "score":0.5 + "score":0.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"mmlu", "metric":"accuracy", - "score":0.4 + "score":0.2 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.0816098185 + "score":0.065945115 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.2781732759 + "score":0.2358663461 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.041496472 + "score":0.0540055322 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yo", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.202397124 + "score":0.2390749172 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.1783312983 + "score":0.246042863 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.4423885999 + "score":0.4917114856 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1632112014 + "score":0.1017188886 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"yue", + "model":"google\/gemma-3-27b-it", + "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.2297357227 + "score":0.1707828137 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"classification", "metric":"accuracy", - "score":0.9 + "score":1.0 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"mgsm", "metric":"accuracy", - "score":0.7 + "score":0.6 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.4 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.249810194 + "score":0.167004472 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.5151255506 + "score":0.400944552 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.1854861198 + "score":0.066271851 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zh", + "model":"google\/gemma-3-27b-it", + "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.2463326959 + "score":0.3937495329 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", "task":"classification", "metric":"accuracy", - "score":0.8 + "score":0.7 }, { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", + "model":"google\/gemma-3-27b-it", + "bcp_47":"yo", "task":"mgsm", "metric":"accuracy", "score":0.2 }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", - "task":"translation_from", - "metric":"bleu", - "score":0.1729786376 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", - "task":"translation_from", - "metric":"chrf", - "score":0.4189697233 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", - "task":"translation_to", - "metric":"bleu", - "score":0.0866404913 - }, - { - "model":"google\/gemini-flash-1.5-8b", - "bcp_47":"zu", - "task":"translation_to", - "metric":"chrf", - "score":0.3943277627 - }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"aeb", - "task":"classification", + "bcp_47":"yo", + "task":"mmlu", "metric":"accuracy", - "score":0.9 + "score":0.2 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"aeb", + "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.2177971147 + "score":0.0472060067 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"aeb", + "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.4738076987 + "score":0.2924612708 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"aeb", + "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.1414064724 + "score":0.0525309984 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"aeb", + "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.3965739567 + "score":0.2304098638 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"af", + "bcp_47":"yue", "task":"classification", "metric":"accuracy", - "score":0.0 + "score":1.0 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"af", + "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2124709579 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"af", + "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.4811646042 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"af", + "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.1392232 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"af", + "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.2205120991 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"classification", "metric":"accuracy", - "score":0.7 + "score":1.0 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"mgsm", "metric":"accuracy", - "score":0.1 + "score":0.8 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"mmlu", "metric":"accuracy", - "score":0.1 + "score":0.5 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.076595229 + "score":0.1900086584 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.2493366365 + "score":0.4895930442 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.0440715947 + "score":0.2395565562 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"ak", + "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.2820233612 + "score":0.3237759485 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"classification", "metric":"accuracy", "score":1.0 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"mgsm", "metric":"accuracy", - "score":0.8 + "score":0.6 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"mmlu", "metric":"accuracy", - "score":0.3 + "score":0.4 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.1913062339 + "score":0.1607803472 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4296053228 + "score":0.4377738064 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.13443556 + "score":0.1538390263 }, { "model":"google\/gemma-3-27b-it", - "bcp_47":"am", + "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.2528930204 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4751516021 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"google\/translate-v2", + "bcp_47":"aeb", "task":"translation_from", "metric":"bleu", - "score":0.24265587 + "score":0.3397504765 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"google\/translate-v2", + "bcp_47":"aeb", "task":"translation_from", "metric":"chrf", - "score":0.4918380331 + "score":0.560449359 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"google\/translate-v2", + "bcp_47":"aeb", "task":"translation_to", "metric":"bleu", - "score":0.2104382871 + "score":0.278826715 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"apc", + "model":"google\/translate-v2", + "bcp_47":"aeb", "task":"translation_to", "metric":"chrf", - "score":0.456050442 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4815690002 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"google\/translate-v2", + "bcp_47":"ak", "task":"translation_from", "metric":"bleu", - "score":0.2891206499 + "score":0.2795001892 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"google\/translate-v2", + "bcp_47":"ak", "task":"translation_from", "metric":"chrf", - "score":0.5438550217 + "score":0.5119662189 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"google\/translate-v2", + "bcp_47":"ak", "task":"translation_to", "metric":"bleu", - "score":0.3184721364 + "score":0.1719218154 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ar", + "model":"google\/translate-v2", + "bcp_47":"ak", "task":"translation_to", "metric":"chrf", - "score":0.5483731849 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ary", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4619906072 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ary", + "model":"google\/translate-v2", + "bcp_47":"am", "task":"translation_from", "metric":"bleu", - "score":0.1664804364 + "score":0.2955792162 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ary", + "model":"google\/translate-v2", + "bcp_47":"am", "task":"translation_from", "metric":"chrf", - "score":0.4585261833 + "score":0.5460142346 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ary", + "model":"google\/translate-v2", + "bcp_47":"am", "task":"translation_to", "metric":"bleu", - "score":0.1299183594 + "score":0.2550661243 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ary", + "model":"google\/translate-v2", + "bcp_47":"am", "task":"translation_to", "metric":"chrf", - "score":0.3752977557 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.3516234079 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"google\/translate-v2", + "bcp_47":"apc", "task":"translation_from", "metric":"bleu", - "score":0.1618648119 + "score":0.3399225795 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"google\/translate-v2", + "bcp_47":"apc", "task":"translation_from", "metric":"chrf", - "score":0.4104839109 + "score":0.5942330704 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"google\/translate-v2", + "bcp_47":"apc", "task":"translation_to", "metric":"bleu", - "score":0.2266738862 + "score":0.2816905761 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"arz", + "model":"google\/translate-v2", + "bcp_47":"apc", "task":"translation_to", "metric":"chrf", - "score":0.4315390742 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"as", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.5676475667 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"as", + "model":"google\/translate-v2", + "bcp_47":"ar", "task":"translation_from", "metric":"bleu", - "score":0.2602059805 + "score":0.3493985929 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"as", + "model":"google\/translate-v2", + "bcp_47":"ar", "task":"translation_from", "metric":"chrf", - "score":0.4987515978 + "score":0.5975748844 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"as", + "model":"google\/translate-v2", + "bcp_47":"ar", "task":"translation_to", "metric":"bleu", - "score":0.0907943093 + "score":0.3475330474 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"as", + "model":"google\/translate-v2", + "bcp_47":"ar", "task":"translation_to", "metric":"chrf", - "score":0.348768221 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"awa", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.5776317086 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"awa", + "model":"google\/translate-v2", + "bcp_47":"ary", "task":"translation_from", "metric":"bleu", - "score":0.3277667824 + "score":0.2092670256 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"awa", + "model":"google\/translate-v2", + "bcp_47":"ary", "task":"translation_from", "metric":"chrf", - "score":0.5267403611 + "score":0.466339127 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"awa", + "model":"google\/translate-v2", + "bcp_47":"ary", "task":"translation_to", "metric":"bleu", - "score":0.2123273366 + "score":0.1728000073 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"awa", + "model":"google\/translate-v2", + "bcp_47":"ary", "task":"translation_to", "metric":"chrf", - "score":0.408906638 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4285875773 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", + "model":"google\/translate-v2", + "bcp_47":"arz", "task":"translation_from", "metric":"bleu", - "score":0.1880331404 + "score":0.2747967998 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", + "model":"google\/translate-v2", + "bcp_47":"arz", "task":"translation_from", "metric":"chrf", - "score":0.4234748209 + "score":0.5090740494 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", + "model":"google\/translate-v2", + "bcp_47":"arz", "task":"translation_to", "metric":"bleu", - "score":0.1517877566 + "score":0.2401570931 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"az", + "model":"google\/translate-v2", + "bcp_47":"arz", "task":"translation_to", "metric":"chrf", - "score":0.423956163 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"be", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4670149488 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"be", + "model":"google\/translate-v2", + "bcp_47":"as", "task":"translation_from", "metric":"bleu", - "score":0.148851004 + "score":0.2674941424 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"be", + "model":"google\/translate-v2", + "bcp_47":"as", "task":"translation_from", "metric":"chrf", - "score":0.4514291775 + "score":0.541891802 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"be", + "model":"google\/translate-v2", + "bcp_47":"as", "task":"translation_to", "metric":"bleu", - "score":0.3105472783 + "score":0.1979823055 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"be", + "model":"google\/translate-v2", + "bcp_47":"as", "task":"translation_to", "metric":"chrf", - "score":0.498684126 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4521218857 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"google\/translate-v2", + "bcp_47":"awa", "task":"translation_from", "metric":"bleu", - "score":0.2430984589 + "score":0.3768023433 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"google\/translate-v2", + "bcp_47":"awa", "task":"translation_from", "metric":"chrf", - "score":0.4969060141 + "score":0.6041064745 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"google\/translate-v2", + "bcp_47":"awa", "task":"translation_to", "metric":"bleu", - "score":0.1699224465 + "score":0.2943485815 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bho", + "model":"google\/translate-v2", + "bcp_47":"awa", "task":"translation_to", "metric":"chrf", - "score":0.3964402252 + "score":0.5100804178 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bm", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bm", + "model":"google\/translate-v2", + "bcp_47":"az", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2273493056 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bm", + "model":"google\/translate-v2", + "bcp_47":"az", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.4822061401 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bm", + "model":"google\/translate-v2", + "bcp_47":"az", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.1907459838 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bm", + "model":"google\/translate-v2", + "bcp_47":"az", "task":"translation_to", "metric":"chrf", - "score":0.0 + "score":0.4304499853 + }, + { + "model":"google\/translate-v2", + "bcp_47":"be", + "task":"translation_from", + "metric":"bleu", + "score":0.2698506992 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "model":"google\/translate-v2", + "bcp_47":"be", + "task":"translation_from", + "metric":"chrf", + "score":0.5332909304 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 + "model":"google\/translate-v2", + "bcp_47":"be", + "task":"translation_to", + "metric":"bleu", + "score":0.3805163094 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "model":"google\/translate-v2", + "bcp_47":"be", + "task":"translation_to", + "metric":"chrf", + "score":0.5444910857 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"google\/translate-v2", + "bcp_47":"bho", "task":"translation_from", "metric":"bleu", - "score":0.2907230812 + "score":0.3207673833 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"google\/translate-v2", + "bcp_47":"bho", "task":"translation_from", "metric":"chrf", - "score":0.5148223626 + "score":0.5578909014 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"google\/translate-v2", + "bcp_47":"bho", "task":"translation_to", "metric":"bleu", - "score":0.3473636391 + "score":0.1931718671 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"bn", + "model":"google\/translate-v2", + "bcp_47":"bho", "task":"translation_to", "metric":"chrf", - "score":0.5442574441 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ca", - "task":"classification", - "metric":"accuracy", - "score":0.0 + "score":0.4102436779 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ca", + "model":"google\/translate-v2", + "bcp_47":"bn", "task":"translation_from", "metric":"bleu", - "score":0.0 + "score":0.2940937001 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ca", + "model":"google\/translate-v2", + "bcp_47":"bn", "task":"translation_from", "metric":"chrf", - "score":0.0 + "score":0.5656960013 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ca", + "model":"google\/translate-v2", + "bcp_47":"bn", "task":"translation_to", "metric":"bleu", - "score":0.0 + "score":0.4105743367 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ca", + "model":"google\/translate-v2", + "bcp_47":"bn", "task":"translation_to", "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ceb", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.582274226 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ceb", "task":"translation_from", "metric":"bleu", - "score":0.3650597419 + "score":0.455106564 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ceb", "task":"translation_from", "metric":"chrf", - "score":0.5512750223 + "score":0.6691241367 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ceb", "task":"translation_to", "metric":"bleu", - "score":0.293824845 + "score":0.5332526559 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ceb", "task":"translation_to", "metric":"chrf", - "score":0.5724817779 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ckb", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.7086055004 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ckb", "task":"translation_from", "metric":"bleu", - "score":0.1983726871 + "score":0.2827542245 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ckb", "task":"translation_from", "metric":"chrf", - "score":0.4779908235 + "score":0.5361942504 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ckb", "task":"translation_to", "metric":"bleu", - "score":0.0792877335 + "score":0.3935667187 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ckb", "task":"translation_to", "metric":"chrf", - "score":0.3908004248 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"cs", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"cs", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"cs", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.6110160857 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"cs", "task":"translation_from", "metric":"bleu", - "score":0.2863884915 + "score":0.3504448262 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"cs", "task":"translation_from", "metric":"chrf", - "score":0.5641108436 + "score":0.6171883377 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"cs", "task":"translation_to", "metric":"bleu", - "score":0.352498756 + "score":0.4493928736 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"cs", "task":"translation_to", "metric":"chrf", - "score":0.5860513143 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"de", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 + "score":0.6238587383 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"de", "task":"translation_from", "metric":"bleu", - "score":0.3577876868 + "score":0.4085073951 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"de", "task":"translation_from", "metric":"chrf", - "score":0.5943423055 + "score":0.6323019852 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"de", "task":"translation_to", "metric":"bleu", - "score":0.5344280565 + "score":0.5247754427 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"de", "task":"translation_to", "metric":"chrf", - "score":0.7084649844 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"el", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"el", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"el", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.7142099767 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"el", "task":"translation_from", "metric":"bleu", - "score":0.2914236052 + "score":0.3267673394 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"el", "task":"translation_from", "metric":"chrf", - "score":0.5147962724 + "score":0.5607576056 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"el", "task":"translation_to", "metric":"bleu", - "score":0.3761179017 + "score":0.3745254965 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"el", "task":"translation_to", "metric":"chrf", - "score":0.5590147212 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"en", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.5676283692 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"en", "task":"translation_from", "metric":"bleu", - "score":0.452427177 + "score":0.6256942034 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"en", "task":"translation_from", "metric":"chrf", - "score":0.6525566656 + "score":0.7540191814 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"en", "task":"translation_to", "metric":"bleu", - "score":0.5467976399 + "score":0.70888051 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"en", "task":"translation_to", "metric":"chrf", - "score":0.7780833183 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"es", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.8684926816 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"es", "task":"translation_from", "metric":"bleu", - "score":0.3554331718 + "score":0.350374858 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"es", "task":"translation_from", "metric":"chrf", - "score":0.5997743406 + "score":0.5997407835 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"es", "task":"translation_to", "metric":"bleu", - "score":0.3847830842 + "score":0.3746387789 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"es", "task":"translation_to", "metric":"chrf", - "score":0.6191109047 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fa", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.6101421618 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fa", "task":"translation_from", "metric":"bleu", - "score":0.2579194729 + "score":0.3295944742 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fa", "task":"translation_from", "metric":"chrf", - "score":0.5351839762 + "score":0.5865092795 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fa", "task":"translation_to", "metric":"bleu", - "score":0.1571676635 + "score":0.2930219204 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fa", "task":"translation_to", "metric":"chrf", - "score":0.4046770996 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fil", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.5297678901 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fil", "task":"translation_from", "metric":"bleu", - "score":0.3771043132 + "score":0.4111750064 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fil", "task":"translation_from", "metric":"chrf", - "score":0.5835797455 + "score":0.6314637291 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fil", "task":"translation_to", "metric":"bleu", - "score":0.3564426025 + "score":0.4316058282 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fil", "task":"translation_to", "metric":"chrf", - "score":0.6107274367 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fr", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.6598411557 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fr", "task":"translation_from", "metric":"bleu", - "score":0.2846092378 + "score":0.3779603397 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fr", "task":"translation_from", "metric":"chrf", - "score":0.5655970541 + "score":0.6286963509 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fr", "task":"translation_to", "metric":"bleu", - "score":0.5192984544 + "score":0.5835846952 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fr", "task":"translation_to", "metric":"chrf", - "score":0.7020040834 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"fuv", - "task":"classification", - "metric":"accuracy", - "score":0.7 + "score":0.7468900473 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fuv", "task":"translation_from", "metric":"bleu", - "score":0.0220051815 + "score":0.1585736619 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fuv", "task":"translation_from", "metric":"chrf", - "score":0.1861453784 + "score":0.3595908619 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fuv", "task":"translation_to", "metric":"bleu", - "score":0.0227307294 + "score":0.0281783964 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"fuv", "task":"translation_to", "metric":"chrf", - "score":0.1850492522 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"gu", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.2135990911 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"gu", "task":"translation_from", "metric":"bleu", - "score":0.2796934014 + "score":0.3338203117 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"gu", "task":"translation_from", "metric":"chrf", - "score":0.5155626456 + "score":0.550900416 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"gu", "task":"translation_to", "metric":"bleu", - "score":0.1979202011 + "score":0.2235904654 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"gu", "task":"translation_to", "metric":"chrf", - "score":0.4528880823 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.4889537149 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ha", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ha", "task":"translation_from", "metric":"bleu", - "score":0.1595296755 + "score":0.3014462049 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ha", "task":"translation_from", "metric":"chrf", - "score":0.3859356797 + "score":0.5332346012 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ha", "task":"translation_to", "metric":"bleu", - "score":0.171830216 + "score":0.2941569015 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ha", "task":"translation_to", "metric":"chrf", - "score":0.4608354018 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hi", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.5452786239 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hi", "task":"translation_from", "metric":"bleu", - "score":0.3520691191 + "score":0.432237812 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hi", "task":"translation_from", "metric":"chrf", - "score":0.6035990708 + "score":0.6378291521 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hi", "task":"translation_to", "metric":"bleu", - "score":0.3987037224 + "score":0.4001439439 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hi", "task":"translation_to", "metric":"chrf", - "score":0.6195037668 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hne", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hne", - "task":"translation_from", - "metric":"bleu", - "score":0.2709410734 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hne", - "task":"translation_from", - "metric":"chrf", - "score":0.4976144005 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hne", - "task":"translation_to", - "metric":"bleu", - "score":0.1150407607 + "score":0.6257483281 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hne", - "task":"translation_to", - "metric":"chrf", - "score":0.3709160058 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ht", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ht", "task":"translation_from", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ht", + "model":"google\/translate-v2", + "bcp_47":"hne", "task":"translation_from", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ht", + "model":"google\/translate-v2", + "bcp_47":"hne", "task":"translation_to", "metric":"bleu", "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ht", + "model":"google\/translate-v2", + "bcp_47":"hne", "task":"translation_to", "metric":"chrf", "score":0.0 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hu", - "task":"classification", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"hu", - "task":"mgsm", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hu", "task":"translation_from", "metric":"bleu", - "score":0.2903150375 + "score":0.3369838412 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hu", "task":"translation_from", "metric":"chrf", - "score":0.5392715859 + "score":0.564308487 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hu", "task":"translation_to", "metric":"bleu", - "score":0.3460432788 + "score":0.4344044669 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"hu", "task":"translation_to", "metric":"chrf", - "score":0.6009670508 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.6654473209 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"id", "task":"translation_from", "metric":"bleu", - "score":0.3377417704 + "score":0.3943233817 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"id", "task":"translation_from", "metric":"chrf", - "score":0.5674360496 + "score":0.6168947522 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"id", - "task":"translation_to", - "metric":"bleu", - "score":0.3534620252 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"id", "task":"translation_to", - "metric":"chrf", - "score":0.6680177029 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ig", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ig", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 + "metric":"bleu", + "score":0.5116660025 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ig", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "model":"google\/translate-v2", + "bcp_47":"id", + "task":"translation_to", + "metric":"chrf", + "score":0.730698655 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ig", "task":"translation_from", "metric":"bleu", - "score":0.1600009223 + "score":0.3708158915 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ig", "task":"translation_from", "metric":"chrf", - "score":0.3857586031 + "score":0.5993132477 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ig", "task":"translation_to", "metric":"bleu", - "score":0.1602266912 + "score":0.2705214178 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ig", "task":"translation_to", "metric":"chrf", - "score":0.4091024664 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ilo", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.504548883 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ilo", "task":"translation_from", "metric":"bleu", - "score":0.1546473042 + "score":0.3900081426 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ilo", "task":"translation_from", "metric":"chrf", - "score":0.3985794204 + "score":0.6052122639 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ilo", "task":"translation_to", "metric":"bleu", - "score":0.1752645287 + "score":0.3336718595 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ilo", "task":"translation_to", "metric":"chrf", - "score":0.4668449261 + "score":0.5750387432 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"it", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"it", "task":"translation_from", "metric":"bleu", - "score":0.3356485456 + "score":0.3278554945 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"it", "task":"translation_from", "metric":"chrf", - "score":0.5684527887 + "score":0.5743022789 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"it", "task":"translation_to", "metric":"bleu", - "score":0.3627134123 + "score":0.3394020951 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"it", "task":"translation_to", "metric":"chrf", - "score":0.6050822949 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ja", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.5938537899 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ja", "task":"translation_from", "metric":"bleu", - "score":0.2481856237 + "score":0.3409989486 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ja", "task":"translation_from", "metric":"chrf", - "score":0.5180749152 + "score":0.5959288844 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ja", "task":"translation_to", "metric":"bleu", - "score":0.242508046 + "score":0.3711980077 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ja", "task":"translation_to", "metric":"chrf", - "score":0.4046420215 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"jv", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.4848412412 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"jv", "task":"translation_from", "metric":"bleu", - "score":0.3019627022 + "score":0.3673114251 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"jv", "task":"translation_from", "metric":"chrf", - "score":0.5133980923 + "score":0.6183652016 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"jv", "task":"translation_to", "metric":"bleu", - "score":0.2316517545 + "score":0.3709969529 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"jv", "task":"translation_to", "metric":"chrf", - "score":0.5189963647 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ki", - "task":"classification", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ki", - "task":"translation_from", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ki", - "task":"translation_from", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ki", - "task":"translation_to", - "metric":"bleu", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ki", - "task":"translation_to", - "metric":"chrf", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kk", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.598464243 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kk", "task":"translation_from", "metric":"bleu", - "score":0.2187004813 + "score":0.3570145905 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kk", "task":"translation_from", "metric":"chrf", - "score":0.4910590831 + "score":0.5887718416 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kk", "task":"translation_to", "metric":"bleu", - "score":0.2108939118 + "score":0.3713033391 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kk", "task":"translation_to", "metric":"chrf", - "score":0.4375825873 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"km", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.604716209 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"km", "task":"translation_from", "metric":"bleu", - "score":0.3274744668 + "score":0.3851664104 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"km", "task":"translation_from", "metric":"chrf", - "score":0.5605813039 + "score":0.6312237305 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"km", "task":"translation_to", "metric":"bleu", - "score":0.0800539722 + "score":0.1874455996 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"km", "task":"translation_to", "metric":"chrf", - "score":0.3336188156 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"kn", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4426393743 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kn", "task":"translation_from", "metric":"bleu", - "score":0.2692189197 + "score":0.3113098415 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kn", "task":"translation_from", "metric":"chrf", - "score":0.5290912174 + "score":0.5501022834 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kn", "task":"translation_to", "metric":"bleu", - "score":0.2869741566 + "score":0.3347737931 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"kn", "task":"translation_to", "metric":"chrf", - "score":0.5072256514 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.5576944014 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ko", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ko", "task":"translation_from", "metric":"bleu", - "score":0.2172591082 + "score":0.2822808126 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ko", "task":"translation_from", "metric":"chrf", - "score":0.478962626 + "score":0.5526101149 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ko", "task":"translation_to", "metric":"bleu", - "score":0.2169046229 + "score":0.2612977966 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ko", "task":"translation_to", "metric":"chrf", - "score":0.3151387909 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"lua", - "task":"classification", - "metric":"accuracy", - "score":0.7 + "score":0.3457225363 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"lua", "task":"translation_from", "metric":"bleu", - "score":0.0905061152 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"lua", "task":"translation_from", "metric":"chrf", - "score":0.321707617 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"lua", "task":"translation_to", "metric":"bleu", - "score":0.0361920973 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"lua", "task":"translation_to", "metric":"chrf", - "score":0.222315171 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mag", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mag", "task":"translation_from", "metric":"bleu", - "score":0.3100950481 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mag", "task":"translation_from", "metric":"chrf", - "score":0.558054933 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mag", - "task":"translation_to", - "metric":"bleu", - "score":0.2213152575 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mag", "task":"translation_to", - "metric":"chrf", - "score":0.4821662369 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mai", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "metric":"bleu", + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", + "bcp_47":"mag", + "task":"translation_to", + "metric":"chrf", + "score":0.0 + }, + { + "model":"google\/translate-v2", "bcp_47":"mai", "task":"translation_from", "metric":"bleu", - "score":0.3126340837 + "score":0.3348942842 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mai", "task":"translation_from", "metric":"chrf", - "score":0.5601639768 + "score":0.5861344551 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mai", "task":"translation_to", "metric":"bleu", - "score":0.1875297747 + "score":0.1311732143 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mai", "task":"translation_to", "metric":"chrf", - "score":0.4394137195 + "score":0.4350789061 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mg", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mg", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mg", "task":"translation_from", "metric":"bleu", - "score":0.2502298144 + "score":0.2903894802 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mg", "task":"translation_from", "metric":"chrf", - "score":0.5206889602 + "score":0.5623472971 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mg", "task":"translation_to", "metric":"bleu", - "score":0.1301910408 + "score":0.2190660395 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mg", "task":"translation_to", "metric":"chrf", - "score":0.4488625613 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ml", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.5006362228 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ml", "task":"translation_from", "metric":"bleu", - "score":0.2809005667 + "score":0.339831623 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ml", "task":"translation_from", "metric":"chrf", - "score":0.5466717628 + "score":0.590846484 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ml", "task":"translation_to", "metric":"bleu", - "score":0.2287455417 + "score":0.3016318322 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ml", "task":"translation_to", "metric":"chrf", - "score":0.4915489263 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"mr", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.5461894184 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mr", "task":"translation_from", "metric":"bleu", - "score":0.3395095603 + "score":0.3491068707 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mr", "task":"translation_from", "metric":"chrf", - "score":0.5877742809 + "score":0.5803894973 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mr", "task":"translation_to", "metric":"bleu", - "score":0.2222923122 + "score":0.3274616019 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"mr", "task":"translation_to", "metric":"chrf", - "score":0.4572688692 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ms", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.5109521029 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ms", "task":"translation_from", "metric":"bleu", - "score":0.3794800258 + "score":0.3962757824 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ms", "task":"translation_from", "metric":"chrf", - "score":0.6256125923 + "score":0.6224286451 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ms", "task":"translation_to", "metric":"bleu", - "score":0.3593747877 + "score":0.5032472209 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ms", "task":"translation_to", "metric":"chrf", - "score":0.664135376 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"my", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.7257127115 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"my", "task":"translation_from", "metric":"bleu", - "score":0.251920694 + "score":0.3361081405 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"my", "task":"translation_from", "metric":"chrf", - "score":0.4662583176 + "score":0.5602875655 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"my", "task":"translation_to", "metric":"bleu", - "score":0.1647980206 + "score":0.282320421 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"my", "task":"translation_to", "metric":"chrf", - "score":0.4166796691 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ne", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.4830195157 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ne", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ne", "task":"translation_from", "metric":"bleu", - "score":0.3022338928 + "score":0.339447252 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ne", "task":"translation_from", "metric":"chrf", - "score":0.5587522289 + "score":0.5865985454 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ne", "task":"translation_to", "metric":"bleu", - "score":0.2252421952 + "score":0.3120075365 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ne", "task":"translation_to", "metric":"chrf", - "score":0.4768786292 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"nl", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"nl", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"nl", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.5354876043 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"nl", "task":"translation_from", "metric":"bleu", - "score":0.2793746981 + "score":0.3500838996 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"nl", "task":"translation_from", "metric":"chrf", - "score":0.5246312011 + "score":0.5820135911 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"nl", "task":"translation_to", "metric":"bleu", - "score":0.3496466203 + "score":0.3833463355 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"nl", "task":"translation_to", "metric":"chrf", - "score":0.6032151622 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ny", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ny", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.630764328 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ny", "task":"translation_from", "metric":"bleu", - "score":0.119086784 + "score":0.2752866209 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ny", "task":"translation_from", "metric":"chrf", - "score":0.3898511388 + "score":0.5470670325 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ny", "task":"translation_to", "metric":"bleu", - "score":0.0923649849 + "score":0.2362408388 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ny", "task":"translation_to", "metric":"chrf", - "score":0.4837931302 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", - "task":"classification", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", - "task":"mgsm", - "metric":"accuracy", - "score":0.1 + "score":0.5649412405 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"om", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"om", "task":"translation_from", "metric":"bleu", - "score":0.0417850648 + "score":0.2628008901 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"om", "task":"translation_from", "metric":"chrf", - "score":0.2509675066 + "score":0.5081811686 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"om", "task":"translation_to", "metric":"bleu", - "score":0.0312813941 + "score":0.0993493347 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"om", "task":"translation_to", "metric":"chrf", - "score":0.2886309955 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"or", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.456860433 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"or", "task":"translation_from", "metric":"bleu", - "score":0.2613495089 + "score":0.3258874325 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"or", "task":"translation_from", "metric":"chrf", - "score":0.5009335042 + "score":0.5886625327 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"or", "task":"translation_to", "metric":"bleu", - "score":0.1648455996 + "score":0.321631251 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"or", "task":"translation_to", "metric":"chrf", - "score":0.3943041737 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_from", - "metric":"bleu", - "score":0.4164890636 + "score":0.5362369434 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pa", "task":"translation_from", - "metric":"chrf", - "score":0.6375470445 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pa", - "task":"translation_to", "metric":"bleu", - "score":0.4166823661 + "score":0.4482674529 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pa", - "task":"translation_to", - "metric":"chrf", - "score":0.575314128 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "task":"translation_from", + "metric":"chrf", + "score":0.671945393 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mgsm", - "metric":"accuracy", - "score":0.9 + "model":"google\/translate-v2", + "bcp_47":"pa", + "task":"translation_to", + "metric":"bleu", + "score":0.5160129517 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pl", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "model":"google\/translate-v2", + "bcp_47":"pa", + "task":"translation_to", + "metric":"chrf", + "score":0.6445374779 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pl", "task":"translation_from", "metric":"bleu", - "score":0.2913506513 + "score":0.3157581247 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pl", "task":"translation_from", "metric":"chrf", - "score":0.5431985912 + "score":0.5682347228 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pl", "task":"translation_to", "metric":"bleu", - "score":0.3723742743 + "score":0.3771434243 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pl", "task":"translation_to", "metric":"chrf", - "score":0.5891983505 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"pt", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.6045220423 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pt", "task":"translation_from", "metric":"bleu", - "score":0.340245547 + "score":0.3489983932 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pt", "task":"translation_from", "metric":"chrf", - "score":0.5681284927 + "score":0.5800455435 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pt", "task":"translation_to", "metric":"bleu", - "score":0.4702737577 + "score":0.5650298473 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"pt", "task":"translation_to", "metric":"chrf", - "score":0.6903236014 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ro", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ro", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ro", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.7365285421 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ro", "task":"translation_from", "metric":"bleu", - "score":0.272965046 + "score":0.3390274579 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ro", "task":"translation_from", "metric":"chrf", - "score":0.5527916308 + "score":0.592940935 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ro", "task":"translation_to", "metric":"bleu", - "score":0.5195197328 + "score":0.5470657372 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ro", "task":"translation_to", "metric":"chrf", - "score":0.6892729705 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ru", - "task":"mmlu", - "metric":"accuracy", - "score":0.3 + "score":0.7020072444 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ru", "task":"translation_from", "metric":"bleu", - "score":0.2862936285 + "score":0.3013142128 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ru", "task":"translation_from", "metric":"chrf", - "score":0.5264436928 + "score":0.5656623498 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ru", "task":"translation_to", "metric":"bleu", - "score":0.4800957551 + "score":0.5178438056 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ru", "task":"translation_to", "metric":"chrf", - "score":0.6618495803 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"rw", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"rw", - "task":"mgsm", - "metric":"accuracy", - "score":0.3 + "score":0.6867971436 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"rw", - "task":"mmlu", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"rw", "task":"translation_from", "metric":"bleu", - "score":0.1701995093 + "score":0.3354195212 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"rw", "task":"translation_from", "metric":"chrf", - "score":0.4262662427 + "score":0.5741211618 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"rw", "task":"translation_to", "metric":"bleu", - "score":0.1513262342 + "score":0.3462677897 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"rw", "task":"translation_to", "metric":"chrf", - "score":0.4732082637 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sd", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.5833767681 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sd", "task":"translation_from", "metric":"bleu", - "score":0.2365858071 + "score":0.3412028977 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sd", "task":"translation_from", "metric":"chrf", - "score":0.4722212406 + "score":0.5889369863 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sd", "task":"translation_to", "metric":"bleu", - "score":0.2251623508 + "score":0.3852572206 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sd", "task":"translation_to", "metric":"chrf", - "score":0.4159341653 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"si", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"si", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.5784169857 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"si", "task":"translation_from", "metric":"bleu", - "score":0.226689844 + "score":0.2698751119 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"si", "task":"translation_from", "metric":"chrf", - "score":0.4706510499 + "score":0.5340401081 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"si", "task":"translation_to", "metric":"bleu", - "score":0.2258552473 + "score":0.4096366215 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"si", "task":"translation_to", "metric":"chrf", - "score":0.4191499082 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sn", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sn", - "task":"mgsm", - "metric":"accuracy", - "score":0.4 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sn", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.5525266748 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sn", "task":"translation_from", "metric":"bleu", - "score":0.0756830418 + "score":0.256568307 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sn", "task":"translation_from", "metric":"chrf", - "score":0.3184767575 + "score":0.4900607089 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sn", "task":"translation_to", "metric":"bleu", - "score":0.0495523985 + "score":0.1305127177 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sn", "task":"translation_to", "metric":"chrf", - "score":0.3971096934 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"so", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.4214140091 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"so", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"so", "task":"translation_from", "metric":"bleu", - "score":0.1915993132 + "score":0.3156233999 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"so", "task":"translation_from", "metric":"chrf", - "score":0.4208812642 + "score":0.5490670273 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"so", "task":"translation_to", "metric":"bleu", - "score":0.1724511246 + "score":0.1872166048 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"so", "task":"translation_to", "metric":"chrf", - "score":0.4741419887 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sr", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sr", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 + "score":0.4920219369 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sr", "task":"translation_from", "metric":"bleu", - "score":0.245439349 + "score":0.321113344 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sr", "task":"translation_from", "metric":"chrf", - "score":0.536270172 + "score":0.5864222708 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sr", "task":"translation_to", "metric":"bleu", - "score":0.3929818488 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sr", - "task":"translation_to", - "metric":"chrf", - "score":0.5787667028 + "score":0.4884555721 }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"su", - "task":"classification", - "metric":"accuracy", - "score":1.0 + { + "model":"google\/translate-v2", + "bcp_47":"sr", + "task":"translation_to", + "metric":"chrf", + "score":0.6556325596 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"su", "task":"translation_from", "metric":"bleu", - "score":0.1784974236 + "score":0.352233215 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"su", "task":"translation_from", "metric":"chrf", - "score":0.4520828188 + "score":0.5470765309 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"su", "task":"translation_to", "metric":"bleu", - "score":0.1435021957 + "score":0.1904552367 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"su", "task":"translation_to", "metric":"chrf", - "score":0.4868234587 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sv", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sv", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sv", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.4562964405 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sv", "task":"translation_from", "metric":"bleu", - "score":0.3258404036 + "score":0.3843214006 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sv", "task":"translation_from", "metric":"chrf", - "score":0.5652149653 + "score":0.6136910044 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sv", "task":"translation_to", "metric":"bleu", - "score":0.4264864443 + "score":0.4689482853 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sv", "task":"translation_to", "metric":"chrf", - "score":0.6543542662 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.6877930778 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"sw", - "task":"mmlu", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sw", "task":"translation_from", "metric":"bleu", - "score":0.268709657 + "score":0.4161610215 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sw", "task":"translation_from", "metric":"chrf", - "score":0.5306834056 + "score":0.6455274177 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sw", "task":"translation_to", "metric":"bleu", - "score":0.3395981599 + "score":0.5117468349 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"sw", "task":"translation_to", "metric":"chrf", - "score":0.6130756934 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ta", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.7232937985 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ta", "task":"translation_from", "metric":"bleu", - "score":0.2563448403 + "score":0.3318364746 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ta", "task":"translation_from", "metric":"chrf", - "score":0.5007966916 + "score":0.5738929543 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ta", "task":"translation_to", "metric":"bleu", - "score":0.2405135195 + "score":0.3895968702 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ta", "task":"translation_to", "metric":"chrf", - "score":0.5564984925 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mgsm", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"te", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.6277778554 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"te", "task":"translation_from", "metric":"bleu", - "score":0.2787922254 + "score":0.4077995927 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"te", "task":"translation_from", "metric":"chrf", - "score":0.5420797212 + "score":0.6409257804 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"te", "task":"translation_to", "metric":"bleu", - "score":0.259866454 + "score":0.485273374 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"te", "task":"translation_to", "metric":"chrf", - "score":0.48543634 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tg", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tg", - "task":"translation_from", - "metric":"bleu", - "score":0.2018690154 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tg", - "task":"translation_from", - "metric":"chrf", - "score":0.4335923466 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tg", - "task":"translation_to", - "metric":"bleu", - "score":0.0972794658 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tg", - "task":"translation_to", - "metric":"chrf", - "score":0.327182503 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"th", - "task":"mgsm", - "metric":"accuracy", - "score":1.0 + "score":0.6710025354 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"th", "task":"translation_from", "metric":"bleu", - "score":0.2400131449 + "score":0.3269754516 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"th", "task":"translation_from", "metric":"chrf", - "score":0.4851690277 + "score":0.5639027355 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"th", "task":"translation_to", "metric":"bleu", - "score":0.383380628 + "score":0.465639801 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"th", "task":"translation_to", "metric":"chrf", - "score":0.5430720239 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ti", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.597395155 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ti", "task":"translation_from", "metric":"bleu", - "score":0.0736674948 + "score":0.2639320429 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ti", "task":"translation_from", "metric":"chrf", - "score":0.2974206944 + "score":0.5034191891 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ti", "task":"translation_to", "metric":"bleu", - "score":0.0241026131 + "score":0.2139020366 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ti", "task":"translation_to", "metric":"chrf", - "score":0.1246172628 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.3242506245 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"tr", "task":"translation_from", "metric":"bleu", - "score":0.2757340333 + "score":0.3693666266 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"tr", "task":"translation_from", "metric":"chrf", - "score":0.5244536559 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"tr", - "task":"translation_to", - "metric":"bleu", - "score":0.3185578758 + "score":0.6134245868 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"tr", "task":"translation_to", - "metric":"chrf", - "score":0.5765088485 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uk", - "task":"classification", - "metric":"accuracy", - "score":0.9 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uk", - "task":"mmlu", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uk", - "task":"translation_from", - "metric":"bleu", - "score":0.2918547905 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uk", - "task":"translation_from", - "metric":"chrf", - "score":0.5631912653 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uk", - "task":"translation_to", - "metric":"bleu", - "score":0.3283437369 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uk", - "task":"translation_to", - "metric":"chrf", - "score":0.5565790802 + "metric":"bleu", + "score":0.3936947375 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"umb", - "task":"classification", - "metric":"accuracy", - "score":0.4 + "model":"google\/translate-v2", + "bcp_47":"tr", + "task":"translation_to", + "metric":"chrf", + "score":0.6497039072 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"umb", + "model":"google\/translate-v2", + "bcp_47":"uk", "task":"translation_from", "metric":"bleu", - "score":0.0359452883 + "score":0.2907704167 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"umb", + "model":"google\/translate-v2", + "bcp_47":"uk", "task":"translation_from", "metric":"chrf", - "score":0.1779043042 + "score":0.5698553329 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"umb", + "model":"google\/translate-v2", + "bcp_47":"uk", "task":"translation_to", "metric":"bleu", - "score":0.0305779168 + "score":0.4401277302 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"umb", + "model":"google\/translate-v2", + "bcp_47":"uk", "task":"translation_to", "metric":"chrf", - "score":0.1838354035 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"ur", - "task":"classification", - "metric":"accuracy", - "score":0.9 + "score":0.6278421339 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ur", "task":"translation_from", "metric":"bleu", - "score":0.2595582459 + "score":0.3080488172 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ur", "task":"translation_from", "metric":"chrf", - "score":0.5043992681 + "score":0.5695112482 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ur", "task":"translation_to", "metric":"bleu", - "score":0.2142625601 + "score":0.3188563568 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"ur", "task":"translation_to", "metric":"chrf", - "score":0.429749938 + "score":0.5116789278 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"uz", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"uz", "task":"translation_from", "metric":"bleu", - "score":0.2595944841 + "score":0.273125871 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"uz", "task":"translation_from", "metric":"chrf", - "score":0.5081810113 + "score":0.5508470442 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"uz", "task":"translation_to", "metric":"bleu", - "score":0.2601189518 + "score":0.3030324343 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"uz", "task":"translation_to", "metric":"chrf", - "score":0.5225655991 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"vi", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.5648891805 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"vi", "task":"translation_from", "metric":"bleu", - "score":0.2279880384 + "score":0.3603047797 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"vi", "task":"translation_from", "metric":"chrf", - "score":0.4835933272 + "score":0.5927521365 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"vi", "task":"translation_to", "metric":"bleu", - "score":0.3478085621 + "score":0.4395780689 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"vi", "task":"translation_to", "metric":"chrf", - "score":0.5968604742 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wo", - "task":"classification", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wo", - "task":"mgsm", - "metric":"accuracy", - "score":0.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wo", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 + "score":0.6552870615 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wo", "task":"translation_from", "metric":"bleu", - "score":0.065945115 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wo", "task":"translation_from", "metric":"chrf", - "score":0.2358663461 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wo", "task":"translation_to", "metric":"bleu", - "score":0.0540055322 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wo", "task":"translation_to", "metric":"chrf", - "score":0.2390749172 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"wuu", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.0 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wuu", "task":"translation_from", "metric":"bleu", - "score":0.246042863 + "score":0.3662176152 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wuu", "task":"translation_from", "metric":"chrf", - "score":0.4917114856 + "score":0.5856640284 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wuu", "task":"translation_to", "metric":"bleu", - "score":0.1017188886 + "score":0.1500486487 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"wuu", "task":"translation_to", "metric":"chrf", - "score":0.1707828137 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"xh", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"xh", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"xh", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.2162606152 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"xh", "task":"translation_from", "metric":"bleu", - "score":0.167004472 + "score":0.3163153725 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"xh", "task":"translation_from", "metric":"chrf", - "score":0.400944552 + "score":0.5712728237 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"xh", "task":"translation_to", "metric":"bleu", - "score":0.066271851 + "score":0.1386875315 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"xh", "task":"translation_to", "metric":"chrf", - "score":0.3937495329 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yo", - "task":"classification", - "metric":"accuracy", - "score":0.7 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yo", - "task":"mgsm", - "metric":"accuracy", - "score":0.2 + "score":0.469849511 }, { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yo", - "task":"mmlu", - "metric":"accuracy", - "score":0.2 - }, - { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yo", "task":"translation_from", "metric":"bleu", - "score":0.0472060067 + "score":0.1925403782 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yo", "task":"translation_from", "metric":"chrf", - "score":0.2924612708 + "score":0.4228528325 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yo", "task":"translation_to", "metric":"bleu", - "score":0.0525309984 + "score":0.0437670613 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yo", "task":"translation_to", "metric":"chrf", - "score":0.2304098638 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"yue", - "task":"classification", - "metric":"accuracy", - "score":1.0 + "score":0.2053727616 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yue", "task":"translation_from", "metric":"bleu", - "score":0.2124709579 + "score":0.2311956685 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yue", "task":"translation_from", "metric":"chrf", - "score":0.4811646042 + "score":0.5099861434 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yue", "task":"translation_to", "metric":"bleu", - "score":0.1392232 + "score":0.281120015 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"yue", "task":"translation_to", "metric":"chrf", - "score":0.2205120991 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mgsm", - "metric":"accuracy", - "score":0.8 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zh", - "task":"mmlu", - "metric":"accuracy", - "score":0.5 + "score":0.3263629293 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zh", "task":"translation_from", "metric":"bleu", - "score":0.1900086584 + "score":0.3441147842 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zh", "task":"translation_from", "metric":"chrf", - "score":0.4895930442 + "score":0.6121137924 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zh", "task":"translation_to", "metric":"bleu", - "score":0.2395565562 + "score":0.4192686299 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zh", "task":"translation_to", "metric":"chrf", - "score":0.3237759485 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zu", - "task":"classification", - "metric":"accuracy", - "score":1.0 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zu", - "task":"mgsm", - "metric":"accuracy", - "score":0.6 - }, - { - "model":"google\/gemma-3-27b-it", - "bcp_47":"zu", - "task":"mmlu", - "metric":"accuracy", - "score":0.4 + "score":0.4558586669 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zu", "task":"translation_from", "metric":"bleu", - "score":0.1607803472 + "score":0.353693059 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zu", "task":"translation_from", "metric":"chrf", - "score":0.4377738064 + "score":0.607730412 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zu", "task":"translation_to", "metric":"bleu", - "score":0.1538390263 + "score":0.3303018306 }, { - "model":"google\/gemma-3-27b-it", + "model":"google\/translate-v2", "bcp_47":"zu", "task":"translation_to", "metric":"chrf", - "score":0.4751516021 + "score":0.5960312224 }, { "model":"gryphe\/mythomax-l2-13b",